
GSoC 2022: Multiweight integration #125

Draft: wants to merge 57 commits into base branch substructure

Changes from 55 commits (57 commits total)
b4bdd79
added multiweight functions to RegionSelection and Cutflows
kfan326 Jul 1, 2022
d62b55e
added initialize for multiweight to regionselectionmanager
kfan326 Jul 7, 2022
20a2e6c
fixed regionSelectionManager destructor
kfan326 Jul 23, 2022
5b68fbe
Update tools/SampleAnalyzer/Process/RegionSelection/RegionSelectionMa…
kfan326 Jul 24, 2022
fecbffc
Update changelog-dev.md
kfan326 Jul 24, 2022
8451685
update changelog-dev.md
jackaraz Jul 25, 2022
ea1789b
Merge branch 'kfan326-main'
jackaraz Jul 25, 2022
beb3b7a
commented out debug for cutflow
kfan326 Jul 31, 2022
0f52721
Merge pull request #3 from MadAnalysis/substructure
kfan326 Aug 1, 2022
8552480
integrated SQLite3 output format for cutflows
kfan326 Aug 2, 2022
a1797b3
added database manager header file
kfan326 Aug 6, 2022
01cb86a
delegated WriteSQL to CounterManager from SampleAnalyzer::Finalize
kfan326 Aug 8, 2022
ac6d797
Merge branch 'MadAnalysis:main' into multi_weight/multi_thread
kfan326 Aug 23, 2022
fad5125
added operators to weight collections
kfan326 Aug 23, 2022
f39ceb6
added histogramming to multiweight integration with SQLite3 output
kfan326 Aug 24, 2022
48eac29
fixed Histogramming Statistics table/Histo WriteSQL to write unique s…
kfan326 Aug 24, 2022
b659986
fixed bug with missing 0 entries
kfan326 Sep 1, 2022
5e3a36c
fixed missing histogram data when entries are 0
kfan326 Sep 1, 2022
922ece8
removed databse entry insertion debug messages
kfan326 Sep 1, 2022
1e39fd2
added weight names to DB
kfan326 Sep 2, 2022
8a3b4d7
get weight names from first sample only, weight names should be ident…
kfan326 Sep 2, 2022
2882fc5
fixed typo in database HistoDescription table xmax
kfan326 Sep 2, 2022
9b879e0
changed cutflow db output file name
kfan326 Sep 8, 2022
c37c293
added detect script for sqlite3
kfan326 Sep 12, 2022
d48cae3
add checkup.py modification
kfan326 Sep 12, 2022
4b7b8a7
update detect sqlite
kfan326 Sep 18, 2022
698ea22
added multiweight to execute function writer
kfan326 Sep 22, 2022
dc1d3bd
edited makefile writers for sqlite3
kfan326 Sep 23, 2022
4e5abe0
interface currently links global version of SQLite3 if detected, Mult…
kfan326 Sep 28, 2022
3777adb
readded databasemanager to interfaces
kfan326 Sep 28, 2022
b393229
removed .DS file
kfan326 Sep 28, 2022
c505e01
Update madanalysis/system/architecture_info.py
kfan326 Oct 20, 2022
9c22841
Update madanalysis/IOinterface/library_writer.py
kfan326 Oct 20, 2022
430bf63
Update madanalysis/core/main.py
kfan326 Oct 20, 2022
3d94e2d
Update madanalysis/system/detect_sqlite.py
kfan326 Oct 20, 2022
af5fb18
Update madanalysis/system/session_info.py
kfan326 Oct 20, 2022
274e0d9
made base class for SQL
kfan326 Oct 21, 2022
0ce8e89
fixed interface for SQLite
kfan326 Oct 21, 2022
777dead
changed SQLite interface to use Pointer to implementation design patt…
kfan326 Nov 25, 2022
1d4762d
refactored database manager functionality to output manager, sample a…
kfan326 Dec 19, 2022
f719875
read sqlite db for histo data instead of SAF
kfan326 Feb 3, 2023
4aebe61
added HistoRequency Fill method for multiweight
kfan326 Feb 8, 2023
63b9f37
added HistoLogX Fill
kfan326 Feb 8, 2023
bc20d21
append stdev array to positive and negative HistogramCore objects
kfan326 Feb 10, 2023
5d326ee
added error bar to plots, not sure if scale is correct
kfan326 Feb 10, 2023
d71e17b
changed histo mean and variation calculation in sqlite reader, there …
kfan326 Feb 23, 2023
624a974
added weight statistics averages to sqlite loader and load from sqlit…
kfan326 Mar 14, 2023
4d0d1b7
fixed sqlite reader bug
kfan326 Mar 14, 2023
be33465
fix bugs with sqlite reader query
kfan326 Mar 14, 2023
a22ffc0
statistics table now uses averages of all weights
kfan326 Mar 15, 2023
9331848
Merge branch 'substructure' into multi_weight/multi_thread
jackaraz Mar 20, 2023
594af5d
duplicated weight names to histo db file
kfan326 Mar 20, 2023
7211fea
regularized mean/stdev by sumw
kfan326 Mar 21, 2023
faee6ff
fixed underflow and overflow bins
kfan326 Mar 21, 2023
984ec51
fixed histologx underflow/overflow
kfan326 Mar 21, 2023
c4619ce
minor fixes
kfan326 Mar 28, 2023
46c7292
removed .DS_store from sqlite interface"
kfan326 Mar 28, 2023
10 changes: 9 additions & 1 deletion doc/releases/changelog-dev.md
@@ -6,6 +6,14 @@

## Bug fixes

* Fixed destructor in `RegionSelectionManager` so that `RegionSelection`
objects allocated inside the `region_vector` are properly destructed upon
exiting the scope/destruction of `RegionSelectionManager`.
([#113](https://github.com/MadAnalysis/madanalysis5/pull/113))


## Contributors

This release contains contributions from (in alphabetical order):

[Kyle Fan](https://github.com/kfan326)
216 changes: 177 additions & 39 deletions madanalysis/IOinterface/job_reader.py

Large diffs are not rendered by default.

1 change: 1 addition & 0 deletions madanalysis/IOinterface/job_writer.py
@@ -750,6 +750,7 @@ def WriteMakefiles(self, option="", **kwargs):

options.has_root_inc = self.main.archi_info.has_root
options.has_root_lib = self.main.archi_info.has_root
options.has_sqlite = self.main.archi_info.has_sqlite3
#options.has_userpackage = True
toRemove=['Log/compilation.log','Log/linking.log','Log/cleanup.log','Log/mrproper.log']

12 changes: 10 additions & 2 deletions madanalysis/IOinterface/library_writer.py
@@ -131,7 +131,7 @@ def WriteMakefileForInterfaces(self,package):
filename = self.path+"/SampleAnalyzer/Test/Makefile_delphesMA5tune"
elif package=='test_root':
filename = self.path+"/SampleAnalyzer/Test/Makefile_root"

# Header
title=''
if package=='commons':
@@ -239,10 +239,13 @@ def WriteMakefileForInterfaces(self,package):
options.ma5_fastjet_mode = self.main.archi_info.has_fastjet
options.has_fastjet_inc = self.main.archi_info.has_fastjet
options.has_fastjet_lib = self.main.archi_info.has_fastjet
#options.has_sqlite_lib = self.main.archi_info.has_sqlite3
options.has_sqlite_tag = self.main.archi_info.has_sqlite3
# options.has_fastjet_ma5lib = self.main.archi_info.has_fastjet
toRemove.extend(['compilation.log','linking.log','cleanup.log','mrproper.log'])
elif package=='test_commons':
options.has_commons = True
options.has_sqlite_tag = self.main.archi_info.has_sqlite3
toRemove.extend(['compilation_commons.log','linking_commons.log','cleanup_commons.log','mrproper_commons.log','../Bin/TestCommons.log'])
elif package=='zlib':
options.has_commons = True
@@ -252,6 +255,7 @@
elif package=='test_zlib':
options.has_commons = True
options.has_zlib_ma5lib = True
options.has_sqlite_tag = self.main.archi_info.has_sqlite3
# options.has_zlib_lib = True
toRemove.extend(['compilation_zlib.log','linking_zlib.log','cleanup_zlib.log','mrproper_zlib.log','../Bin/TestZlib.log'])
elif package=='delphes':
@@ -324,6 +328,8 @@ def WriteMakefileForInterfaces(self,package):
options.has_fastjet_lib = self.main.archi_info.has_fastjet
options.ma5_fastjet_mode = self.main.archi_info.has_fastjet
options.has_substructure = self.main.archi_info.has_fjcontrib and self.main.archi_info.has_fastjet
options.has_sqlite_tag = self.main.archi_info.has_sqlite3
options.has_sqlite_lib = self.main.archi_info.has_sqlite3

toRemove.extend(['compilation.log','linking.log','cleanup.log','mrproper.log'])
elif package=='test_process':
@@ -342,6 +348,8 @@ def WriteMakefileForInterfaces(self,package):
# options.has_delphesMA5tune_tag = self.main.archi_info.has_delphesMA5tune
# options.has_zlib_tag = self.main.archi_info.has_zlib
toRemove.extend(['compilation_process.log','linking_process.log','cleanup_process.log','mrproper_process.log','../Bin/TestSampleAnalyzer.log'])
elif package=='sqlite':
options.has_sqlite = self.main.archi_info.has_sqlite3

# file pattern
if package in ['commons','process','configuration']:
@@ -373,7 +381,7 @@ def WriteMakefileForInterfaces(self,package):
hfiles = ['DelphesMA5tune/*.h']
elif package=='test_root':
cppfiles = ['Root/*.cpp']
hfiles = ['Root/*.h']
else:
cppfiles = [package+'/*.cpp']
hfiles = [package+'/*.h']
189 changes: 189 additions & 0 deletions madanalysis/IOinterface/sqlite_reader.py
@@ -0,0 +1,189 @@
import sqlite3
from matplotlib import pyplot as plt
import numpy as np
import math
import statistics


def getMeanAndStdevOld(path):

con = sqlite3.connect(path)
cursor = con.cursor()

bin_data = cursor.execute("select * from data;").fetchall()

pos_bins = dict()
neg_bins = dict()

## bin_data has all data for the histogram, need to get mean and standard deviation for each bin
## each row of the query is a tuple of 5 elements [histo name, weight id, bin #, positive value, negative value]
## sort them into +bin/-bin[name] -> bin # -> [mean, standard deviation]

for row in bin_data:
## if the histo name is not inside the bin dictionaries, create a new dictionary for each of +/- bin dictionary
## append values to +/-bin[name][bin#]

if row[0] not in pos_bins or row[0] not in neg_bins:
pos_bins[row[0]] = dict()
neg_bins[row[0]] = dict()
pos_bins[row[0]][row[2]] = [float(row[3])]
neg_bins[row[0]][row[2]] = [float(row[4])]

else:
if row[2] in pos_bins[row[0]] or row[2] in neg_bins[row[0]]:
pos_bins[row[0]][row[2]].append(float(row[3]))
neg_bins[row[0]][row[2]].append(float(row[4]))
else :
pos_bins[row[0]][row[2]] = [float(row[3])]
neg_bins[row[0]][row[2]] = [float(row[4])]

output = dict()

for histo_name in pos_bins:
output[histo_name] = dict()
for bin_i in pos_bins[histo_name]:
output[histo_name][bin_i] = [statistics.mean(pos_bins[histo_name][bin_i]), statistics.stdev(pos_bins[histo_name][bin_i])]

for histo_name in neg_bins:
for bin_i in neg_bins[histo_name]:
output[histo_name][bin_i].extend([statistics.mean(neg_bins[histo_name][bin_i]), statistics.stdev(neg_bins[histo_name][bin_i])])

return output


def getStatistics(stats):
histoname_dict = dict()
for entry in stats:
if entry[0] not in histoname_dict:
histoname_dict[entry[0]] = dict()
histoname_dict[entry[0]][entry[1]] = float(entry[2]) - float(entry[3])
return histoname_dict


def getMeanAndStdev(path):

con = sqlite3.connect(path)
cursor = con.cursor()
bin_data = cursor.execute("select * from data;").fetchall()
stats_data = cursor.execute("select name, id, pos_sum_event_weights_over_events, neg_sum_event_weights_over_events from Statistics").fetchall()

statsdict = getStatistics(stats_data)


## parse data in the form of parsed_data[histo_name][bin #][{positive value, negative value}]
parsed_data = dict()
for row in bin_data:

histo_name = row[0]
weight_id = row[1]
bin_number = row[2]
sumw = statsdict[histo_name][str(weight_id)]
value = (float(row[3]) - abs(float(row[4]))) / sumw
if histo_name not in parsed_data:
## if histo name is not in the parsed_data dictionary, create a new bin dictionary for that histo, then a value list for that bin
parsed_data[histo_name] = dict()
parsed_data[histo_name][bin_number] = []

else:
## histo name is already in the parsed_data dictionary; check whether the bin is in its dictionary and, if not, create a value list for that bin
if bin_number not in parsed_data[histo_name]:
parsed_data[histo_name][bin_number] = []

parsed_data[histo_name][bin_number].append(value)

output = dict()
for histo_name in parsed_data:
output[histo_name] = dict()
for bin_number in parsed_data[histo_name]:
output[histo_name][bin_number] = [statistics.mean(parsed_data[histo_name][bin_number]), statistics.stdev(parsed_data[histo_name][bin_number])]

return output

def getHistoStatisticsAvg(path):

con = sqlite3.connect(path)
cursor = con.cursor()


statistics = cursor.execute("select name, avg(pos_num_events), avg(neg_num_events), avg(pos_sum_event_weights_over_events), avg(neg_sum_event_weights_over_events), avg(pos_entries), avg(neg_entries), avg(pos_sum_event_weights_over_entries), avg(neg_sum_event_weights_over_entries), avg(pos_sum_squared_weights), avg(neg_sum_squared_weights), avg(pos_value_times_weight), avg(neg_value_times_weight), avg(pos_value_squared_times_weight), avg(neg_value_squared_times_weight) from Statistics group by name;").fetchall()

statdict = dict()
for i in range(len(statistics)):
statdict[statistics[i][0]] = statistics[i][1:]

return statdict
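
The `avg(...) GROUP BY name` query above collapses the per-weight rows of the `Statistics` table into one averaged row per histogram. A minimal standalone sketch of that reduction, using a cut-down two-column `Statistics` table (the real table has many more averaged columns; the schema here is an assumption for illustration):

```python
import sqlite3

# In-memory database with a reduced Statistics table: one row per
# (histogram, weight variation), holding only pos_entries.
con = sqlite3.connect(":memory:")
cur = con.cursor()
cur.execute("CREATE TABLE Statistics (name TEXT, pos_entries REAL)")
cur.executemany(
    "INSERT INTO Statistics VALUES (?, ?)",
    [("pt", 100.0), ("pt", 140.0), ("eta", 50.0)],
)

# Same shape as getHistoStatisticsAvg: average each column across weights,
# grouped by histogram name.
rows = cur.execute(
    "SELECT name, avg(pos_entries) FROM Statistics GROUP BY name;"
).fetchall()
statdict = {name: avg for name, avg in rows}
print(statdict)  # pt averages to 120.0, eta to 50.0
```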






## debug for printing out output dictionary
## structure is as follows:
## output[histogram_name][bin #] = [positive mean, positive stdev, negative mean, negative stddev]


def DBreader_debug(output):

for name in output:
print(name)
for eachbin in output[name]:
print(eachbin)
for val in output[name][eachbin]:
print(val)


for histo in output:
num_of_keys = len(output[histo].keys())
labels = [None] * num_of_keys
for i in range(1,num_of_keys):
labels[i] = i
labels[0] = 'underflow'
labels[num_of_keys-1] = 'overflow'
positives = [None] * num_of_keys
negatives = [None] * num_of_keys
for row in output[histo]:
if(row == 'underflow'):
positives[0] = output[histo][row][0]
negatives[0] = output[histo][row][2]
elif(row == 'overflow'):
positives[num_of_keys-1] = output[histo][row][0]
negatives[num_of_keys-1] = output[histo][row][2]
else:
positives[int(row)] = output[histo][row][0]
negatives[int(row)] = output[histo][row][2]
#for label in labels:
# print(label)
#for val in positives:
# print(val)
#for val in negatives:
# print(val)
x = np.arange(num_of_keys)
width = 0.5
fig, ax = plt.subplots()
rects1 = ax.bar(x - width/3, positives, width, label="positives avg")
rects2 = ax.bar(x + width/3, negatives, width, label="negatives avg")

ax.set_ylabel('Events Luminosity = ')
ax.set_title(histo)
ax.set_xticks(x, labels, rotation = 65)
ax.legend()

#ax.bar_label(rects1, padding=3)
#ax.bar_label(rects2, padding=3)

fig.tight_layout()
plt.show()


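As a sanity check of the per-bin reduction implemented in `getMeanAndStdev`, a minimal standalone sketch on an in-memory database; the `data` and `Statistics` schemas here are assumptions inferred from the queries in this file, not the exact tables written by the SQLite3 output format:

```python
import sqlite3
import statistics

# Tiny in-memory database mimicking the assumed schema:
# data(name, weight id, bin, positive value, negative value) and a
# Statistics table providing the per-weight sum of weights for normalisation.
con = sqlite3.connect(":memory:")
cur = con.cursor()
cur.execute("CREATE TABLE data (name TEXT, id TEXT, bin TEXT, pos REAL, neg REAL)")
cur.execute(
    "CREATE TABLE Statistics (name TEXT, id TEXT, "
    "pos_sum_event_weights_over_events REAL, "
    "neg_sum_event_weights_over_events REAL)"
)
# One histogram ('pt'), one bin, two weight variations.
cur.executemany(
    "INSERT INTO data VALUES (?, ?, ?, ?, ?)",
    [("pt", "0", "1", 10.0, 0.0), ("pt", "1", "1", 12.0, 0.0)],
)
cur.executemany(
    "INSERT INTO Statistics VALUES (?, ?, ?, ?)",
    [("pt", "0", 2.0, 0.0), ("pt", "1", 2.0, 0.0)],
)

# Reduction as in getMeanAndStdev: per weight, value = (pos - |neg|) / sumw,
# then mean and stdev across the weight variations of each bin.
sumw = {
    (n, i): p - m
    for n, i, p, m in cur.execute(
        "SELECT name, id, pos_sum_event_weights_over_events, "
        "neg_sum_event_weights_over_events FROM Statistics"
    )
}
bins = {}
for name, wid, b, pos, neg in cur.execute("SELECT * FROM data"):
    value = (pos - abs(neg)) / sumw[(name, wid)]
    bins.setdefault((name, b), []).append(value)

result = {k: (statistics.mean(v), statistics.stdev(v)) for k, v in bins.items()}
print(result)  # values 5.0 and 6.0 give mean 5.5, stdev ~0.707
```

With two weights giving normalised bin values 5.0 and 6.0, the bin is reported as mean 5.5 with a sample standard deviation of sqrt(0.5), matching what the reader would hand to the plotting code as the central value and error bar.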
35 changes: 32 additions & 3 deletions madanalysis/build/makefile_writer.py
@@ -41,6 +41,7 @@ def __init__(self):
self.has_fastjet = False
self.has_delphes = False
self.has_delphesMA5tune = False
self.has_sqlite3 = False


@staticmethod
@@ -98,7 +99,10 @@ def UserfriendlyMakefileForSampleAnalyzer(filename,options):
file.write('\tcd Test && $(MAKE) -f Makefile_delphesMA5tune\n')
if options.has_process:
file.write('\tcd Process && $(MAKE) -f Makefile\n')
file.write('\tcd Test && $(MAKE) -f Makefile_process\n')
if options.has_sqlite3:
file.write('\tcd Interfaces && $(MAKE) -f Makefile_sqlite\n')
file.write('\tcd Test && $(MAKE) -f Makefile_sqlite\n')
file.write('\n')

# Clean
@@ -125,6 +129,9 @@ def UserfriendlyMakefileForSampleAnalyzer(filename,options):
if options.has_process:
file.write('\tcd Process && $(MAKE) -f Makefile clean\n')
file.write('\tcd Test && $(MAKE) -f Makefile_process clean\n')
if options.has_sqlite3:
file.write('\tcd Interfaces && $(MAKE) -f Makefile_sqlite clean\n')
file.write('\tcd Test && $(MAKE) -f Makefile_sqlite clean\n')
file.write('\n')

# Mrproper
@@ -152,6 +159,9 @@ def UserfriendlyMakefileForSampleAnalyzer(filename,options):
if options.has_process:
file.write('\tcd Process && $(MAKE) -f Makefile mrproper\n')
file.write('\tcd Test && $(MAKE) -f Makefile_process mrproper\n')
if options.has_sqlite3:
file.write('\tcd Interfaces && $(MAKE) -f Makefile_sqlite mrproper\n')
file.write('\tcd Test && $(MAKE) -f Makefile_sqlite mrproper\n')
file.write('\n')

# Closing the file
@@ -194,6 +204,9 @@ def __init__(self):
self.has_root_tag = False
self.has_root_lib = False
self.has_root_ma5lib = False
self.has_sqlite = False
self.has_sqlite_tag = False
self.has_sqlite_lib = False



@@ -321,7 +334,9 @@ def Makefile(
for header in archi_info.delphesMA5tune_inc_paths:
cxxflags.extend(['-I'+header])
file.write('CXXFLAGS += '+' '.join(cxxflags)+'\n')

# - tags
cxxflags=[]
if options.has_root_tag:
@@ -338,6 +353,8 @@
cxxflags.extend(['-DDELPHES_USE'])
if options.has_delphesMA5tune_tag:
cxxflags.extend(['-DDELPHESMA5TUNE_USE'])
if options.has_sqlite_tag:
cxxflags.extend(['-DSQLITE3_USE'])
Review comment (Member) on lines +356 to +357, suggested change (remove these lines):
    if options.has_sqlite_tag:
        cxxflags.extend(['-DSQLITE3_USE'])
See the comments above.
if len(cxxflags)!=0:
file.write('CXXFLAGS += '+' '.join(cxxflags)+'\n')
file.write('\n')
@@ -347,7 +364,9 @@

# - general
libs=[]
file.write('LIBFLAGS = \n')

# added SQL
#file.write('LIBFLAGS = -l sqlite3\n')

# - commons
if options.has_commons:
@@ -429,6 +448,14 @@
if options.has_heptoptagger:
file.write('LIBFLAGS += -lHEPTopTagger_for_ma5\n')

# SQLite3
if options.has_sqlite:
file.write('LIBFLAGS += -l sqlite3\n')
Review comment (Member), suggested change:
-    file.write('LIBFLAGS += -l sqlite3\n')
+    file.write('LIBFLAGS += -lsqlite_for_ma5\n')
Let's keep the has_sqlite option for the analysis and has_sqlite_lib for compiling the interface. The analysis should not be directly compiled with sqlite.

if options.has_sqlite_lib:
file.write('LIBFLAGS += -l sqlite_for_ma5\n')


# - Commons
if options.has_commons:
libs=[]
@@ -464,6 +491,8 @@ def Makefile(
libs.append('$(MA5_BASE)/tools/SampleAnalyzer/Lib/libsubstructure_for_ma5.so')
if options.has_heptoptagger:
libs.append('$(MA5_BASE)/tools/SampleAnalyzer/Lib/libHEPTopTagger_for_ma5.so')
if options.has_sqlite_lib:
libs.append('$(MA5_BASE)/tools/SampleAnalyzer/Lib/libsqlite_for_ma5.so')
if len(libs)!=0:
file.write('# Requirements to check before building\n')
for ind in range(0,len(libs)):
4 changes: 4 additions & 0 deletions madanalysis/core/library_builder.py
@@ -80,6 +80,10 @@ def checkMA5(self):
libraries.append(self.archi_info.ma5dir+'/tools/SampleAnalyzer/Lib/libdelphes_for_ma5.so')
if self.archi_info.has_delphesMA5tune:
libraries.append(self.archi_info.ma5dir+'/tools/SampleAnalyzer/Lib/libdelphesMA5tune_for_ma5.so')
if self.archi_info.has_sqlite3:
libraries.append(self.archi_info.ma5dir+'/tools/SampleAnalyzer/Lib/libsqlite_for_ma5.so')


for library in libraries:
if not os.path.isfile(library):
self.logger.debug('\t-> library '+ library + " not found.")