SciCompMod
diff --git a/‎pycode/examples/epidata/ProgressIndicator.py‎
Lines changed: 14 additions & 9 deletions b/‎pycode/examples/epidata/ProgressIndicator.py‎
Lines changed: 14 additions & 9 deletions
diff --git a/‎pycode/memilio-epidata/memilio/epidata/getCaseData.py‎
Lines changed: 12 additions & 11 deletions b/‎pycode/memilio-epidata/memilio/epidata/getCaseData.py‎
Lines changed: 12 additions & 11 deletions
diff --git a/‎pycode/memilio-epidata/memilio/epidata/getCaseDatawithEstimations.py‎
Lines changed: 3 additions & 2 deletions b/‎pycode/memilio-epidata/memilio/epidata/getCaseDatawithEstimations.py‎
Lines changed: 3 additions & 2 deletions
diff --git a/‎pycode/memilio-epidata/memilio/epidata/getCommuterMobility.py‎
Lines changed: 37 additions & 17 deletions b/‎pycode/memilio-epidata/memilio/epidata/getCommuterMobility.py‎
Lines changed: 37 additions & 17 deletions
diff --git a/‎pycode/memilio-epidata/memilio/epidata/getDIVIData.py‎
Lines changed: 2 additions & 1 deletion b/‎pycode/memilio-epidata/memilio/epidata/getDIVIData.py‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎pycode/memilio-epidata/memilio/epidata/getDataIntoPandasDataFrame.py‎
Lines changed: 39 additions & 23 deletions b/‎pycode/memilio-epidata/memilio/epidata/getDataIntoPandasDataFrame.py‎
Lines changed: 39 additions & 23 deletions
@@ -17,28 +17,33 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #############################################################################
-"""@ProgressIndicator.py
-WARNING: This file is currently not tested and maintained.
-"""
+
 from memilio import progress_indicator
 import time
 
 print("This is only a usage example, and does not actually do anything.")
+# Also, the following values for delay, sleep etc. are chosen arbitrarily,
+# and have no further relevance other than to demonstrate the indicator.
+
 # using start/stop
 p = progress_indicator.Dots(message="waiting", delay=0.5)
 p.start()
 time.sleep(1.6)
 p.stop()
-# using with as block
+
+# using with-as block
 with progress_indicator.Percentage(message="download 1", delay=0.4) as p:
     for i in range(13):
         time.sleep(0.1467)
-        p.set_progress((i+1)/13)
+        p.set_progress((i + 1) / 13)
+
 with progress_indicator.Percentage(message="download 2", use_bar=False,
-                delay=0, keep_output=False) as p:
+                                   delay=0, keep_output=False) as p:
     for i in range(97):
         time.sleep(0.0367)
-        p.set_progress((i+1)/97)
-# using with block ('as' is not usefull without Percentage)
+        p.set_progress((i + 1) / 97)
+
+# using with block
+# the 'as' is only required for calling e.g. message() or set_progress()
 with progress_indicator.Spinner(message="finish"):
-    time.sleep(2)
+    time.sleep(2)
@@ -327,15 +327,15 @@ def get_case_data(read_data=dd.defaultDict['read_data'],
             if dict_files[file][2] == None:
                 df_local_cs = df_local.cumsum().reset_index(drop=False)
             else:
-                df_local_cs = df_local.groupby(
-                    level=[dict_files[file][0].index(level_index) for level_index in dict_files[file][2]]).cumsum().reset_index()
+                df_local_cs = df_local.groupby(level=[dict_files[file][0].index(
+                    level_index) for level_index in dict_files[file][2]]).cumsum().reset_index()
 
             if impute_dates or moving_average > 0:
-                df_local_cs = mdfs.impute_and_reduce_df(df_local_cs,
-                                                        group_by_cols=dict_files[file][3],
-                                                        mod_cols=dict_files[file][4],
-                                                        impute='forward', moving_average=moving_average,
-                                                        min_date=start_date, max_date=end_date)
+                df_local_cs = mdfs.impute_and_reduce_df(
+                    df_local_cs, group_by_cols=dict_files[file][3],
+                    mod_cols=dict_files[file][4],
+                    impute='forward', moving_average=moving_average,
+                    min_date=start_date, max_date=end_date)
 
             df_local_cs = mdfs.extract_subframe_based_on_dates(
                 df_local_cs, start_date, end_date)
@@ -362,10 +362,11 @@ def get_case_data(read_data=dd.defaultDict['read_data'],
                     plt.show()
 
                 if file == 'all_gender':
-                    df.groupby(Geschlecht) \
-                        .agg({AnzahlFall: sum, AnzahlTodesfall: sum, AnzahlGenesen: sum}) \
-                        .plot(title='COVID-19 infections, deaths, recovered', grid=True,
-                              kind='bar')
+                    df.groupby(Geschlecht).agg(
+                        {AnzahlFall: sum, AnzahlTodesfall: sum,
+                         AnzahlGenesen: sum}).plot(
+                        title='COVID-19 infections, deaths, recovered',
+                        grid=True, kind='bar')
                     plt.tight_layout()
                     plt.show()
 
 
@@ -84,8 +84,9 @@ def get_case_data_with_estimations(
             rep_date)
 
         # get data from John Hopkins University
-        gjd.get_jh_data(read_data, file_format, out_folder, no_raw,
-                        start_date, end_date, impute_dates, moving_average, make_plot_jh)
+        gjd.get_jh_data(
+            read_data, file_format, out_folder, no_raw, start_date, end_date,
+            impute_dates, moving_average, make_plot_jh)
 
     # Now we now which data is generated and we can use it
     # read in jh data
 
@@ -183,8 +183,8 @@ def get_commuter_data(read_data=dd.defaultDict['read_data'],
     govkey2numlist = collections.OrderedDict(
         zip(govkey_list, list(range(0, len(govkey_list)))))
 
-    (countykey2govkey, countykey2localnumlist, gov_county_table, state_gov_table) = assign_geographical_entities(
-        countykey_list, govkey_list)
+    (countykey2govkey, countykey2localnumlist, gov_county_table,
+     state_gov_table) = assign_geographical_entities(countykey_list, govkey_list)
 
     mat_commuter_migration = np.zeros(
         [len(countykey_list), len(countykey_list)])
@@ -203,7 +203,6 @@ def get_commuter_data(read_data=dd.defaultDict['read_data'],
     n = 0
 
     for item in files:
-
         # Using the 'Einpendler' sheet to correctly distribute summed values over counties of other gov. region
         # This File is in a zip folder so it has to be unzipped first before it can be read.
         param_dict = {"sheet_name": 3, "engine": "pyxlsb"}
@@ -233,8 +232,8 @@ def get_commuter_data(read_data=dd.defaultDict['read_data'],
                 curr_county_migratedto = commuter_migration_file.iloc[i][1]
                 current_key = commuter_migration_file.iloc[i][0]
                 # migration to itself excluded!
-                counties_migratedfrom[countykey2govkey[current_key]
-                                      ][countykey2localnumlist[current_key]] = 1
+                counties_migratedfrom[countykey2govkey[current_key]][
+                    countykey2localnumlist[current_key]] = 1
 
             if not isinstance(commuter_migration_file.iloc[i][2], float):
                 # removal of nan's, regional keys are stored as strings
@@ -249,8 +248,8 @@ def get_commuter_data(read_data=dd.defaultDict['read_data'],
                         val = commuter_migration_file.iloc[i][4]
                         mat_commuter_migration[current_row, current_col] = val
                         checksum += val
-                        counties_migratedfrom[countykey2govkey[commuter_migration_file.iloc[i][2]]][
-                            countykey2localnumlist[commuter_migration_file.iloc[i][2]]] = 1
+                        counties_migratedfrom[countykey2govkey[commuter_migration_file.iloc[i][2]]
+                                              ][countykey2localnumlist[commuter_migration_file.iloc[i][2]]] = 1
 
                     # take summed values of other REMAINING counties of government region
                     # here, some counties of the region are stated explicitly and the rest is summed
@@ -265,15 +264,23 @@ def get_commuter_data(read_data=dd.defaultDict['read_data'],
                             # sum population of all counties not explicitly migrated from
                             # of the current gov region migrated from
                         dummy_pop_sum = 0
-                        for k in range(0, len(gov_county_table[govkey2numlist[dummy_key_wozeros]])):
+                        for k in range(
+                            0,
+                            len(
+                                gov_county_table
+                                [govkey2numlist[dummy_key_wozeros]])):
                             if counties_migratedfrom[govkey2numlist[dummy_key_wozeros]][k] < 1:
                                 # get identifier (0-401) for county key
                                 globindex = countykey2numlist[gov_county_table[govkey2numlist[dummy_key_wozeros]][k]]
                                 # sum up
                                 dummy_pop_sum += countypop_list[globindex]
 
                         # distribute emigration relatively to county population where migration comes from
-                        for k in range(0, len(gov_county_table[govkey2numlist[dummy_key_wozeros]])):
+                        for k in range(
+                            0,
+                            len(
+                                gov_county_table
+                                [govkey2numlist[dummy_key_wozeros]])):
                             if counties_migratedfrom[govkey2numlist[dummy_key_wozeros]][k] < 1:
                                 # get identifier (0-401) for county key
                                 globindex = countykey2numlist[gov_county_table[govkey2numlist[dummy_key_wozeros]][k]]
@@ -294,20 +301,32 @@ def get_commuter_data(read_data=dd.defaultDict['read_data'],
                         # sum population of all counties not explicitly migrated to
                         # of the current gov region migrated to
                         dummy_pop_sum = 0
-                        for k in range(0, len(gov_county_table[govkey2numlist[commuter_migration_file.iloc[i][2]]])):
+                        for k in range(
+                            0,
+                            len(
+                                gov_county_table
+                                [
+                                    govkey2numlist
+                                    [commuter_migration_file.iloc[i][2]]])):
                             if counties_migratedfrom[govkey2numlist[commuter_migration_file.iloc[i][2]]][k] < 1:
                                 # get identifier (0-401) for county key
-                                globindex = countykey2numlist[gov_county_table[govkey2numlist[
-                                    commuter_migration_file.iloc[i][2]]][k]]
+                                globindex = countykey2numlist[gov_county_table[
+                                    govkey2numlist[commuter_migration_file.iloc[i][2]]][k]]
                                 # sum up
                                 dummy_pop_sum += countypop_list[globindex]
 
                         # distribute emigration relatively to county population where migration comes from
-                        for k in range(0, len(gov_county_table[govkey2numlist[commuter_migration_file.iloc[i][2]]])):
+                        for k in range(
+                            0,
+                            len(
+                                gov_county_table
+                                [
+                                    govkey2numlist
+                                    [commuter_migration_file.iloc[i][2]]])):
                             if counties_migratedfrom[govkey2numlist[commuter_migration_file.iloc[i][2]]][k] < 1:
                                 # get identifier (0-401) for county key
-                                globindex = countykey2numlist[gov_county_table[govkey2numlist[
-                                    commuter_migration_file.iloc[i][2]]][k]]
+                                globindex = countykey2numlist[gov_county_table[
+                                    govkey2numlist[commuter_migration_file.iloc[i][2]]][k]]
                                 counties_migratedfrom[govkey2numlist[commuter_migration_file.iloc[i][2]]][k] = 1
 
                                 # set value computed relatively to county size and effective migration
@@ -567,8 +586,9 @@ def main():
 
     arg_dict_commuter = {**arg_dict, "setup_dict": setup_dict}
 
-    get_neighbors_mobility(1001, abs_tol=0, rel_tol=0, tol_comb='or',
-                           merge_eisenach=True, out_folder=dd.defaultDict['out_folder'])
+    get_neighbors_mobility(
+        1001, abs_tol=0, rel_tol=0, tol_comb='or', merge_eisenach=True,
+        out_folder=dd.defaultDict['out_folder'])
 
     get_commuter_data(**arg_dict_commuter)
 
 
@@ -86,7 +86,8 @@ def get_divi_data(read_data=dd.defaultDict['read_data'],
     # First csv data on 24-04-2020
     if start_date < date(2020, 4, 24):
         print("Warning: First data available on 2020-04-24. "
-              "You asked for " + start_date.strftime("%Y-%m-%d") + ". Changed it to 2020-04-24.")
+              "You asked for " + start_date.strftime("%Y-%m-%d") +
+              ". Changed it to 2020-04-24.")
         start_date = date(2020, 4, 24)
 
     directory = os.path.join(out_folder, 'Germany/')
 
@@ -55,7 +55,9 @@ def user_choice(message, default=False):
             print("Please answer with y (yes) or n (no)")
 
 
-def download_file(url, chunk_size=1024, timeout=None, progress_function=None, verify=True, interactive=True):
+def download_file(
+        url, chunk_size=1024, timeout=None, progress_function=None,
+        verify=True):
     """! Download a file using GET over HTTP.
 
     @param url Full url of the file to download.
@@ -67,19 +69,22 @@ def download_file(url, chunk_size=1024, timeout=None, progress_function=None, ve
     @param timeout Timeout in seconds for the GET request.
     @param progress_function Function called regularly, with the current
         download progress in [0,1] as a float argument.
-    @param interactive bool. Whether to ask for user input. If False, raises Errors instead.
+    @param verify bool or "interactive". If False, ignores the connection's
+        security. If True, only downloads from secure connections are made,
+        and insecure connections raise a FileNotFoundError. If "interactive",
+        prompts the user whether or not to allow insecure connections.
     @return File as BytesIO
     """
-    if verify == False:
-        # suppress this warning since the insecure requests is intentional
-        urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
     # send GET request as stream so the content is not downloaded at once
     try:
-        req = requests.get(url, stream=True, timeout=timeout, verify=verify)
+        req = requests.get(
+            url, stream=True, timeout=timeout,
+            verify=verify == True or verify == "interactive")
     except OSError:
-        if interactive and user_choice(url + " could not be opened due to an "
-                                       "unsecure connection. Do you want to "
-                                       "open it anyways?\n"):
+        if verify == "interactive" and user_choice(
+            url +
+            " could not be opened due to an insecure connection. "
+                "Do you want to open it anyways?\n"):
             urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
             req = requests.get(url, stream=True, timeout=timeout, verify=False)
         else:
@@ -132,12 +137,15 @@ def extract_zip(file, **param_dict):
     return all_dfs
 
 
-def get_file(filepath='', url='', read_data=dd.defaultDict['read_data'], param_dict={}, interactive=True):
+def get_file(
+        filepath='', url='', read_data=dd.defaultDict['read_data'],
+        param_dict={},
+        interactive=True):
     """! Loads data from filepath and stores it in a pandas dataframe.
-    If data can't be read from given filepath the user is asked wether the file should be downloaded from the given url or not.
+    If data can't be read from given filepath the user is asked whether the file should be downloaded from the given url or not.
     Uses the progress indicator to give feedback.
 
-    @param filepath String. Filepath where data es read from.
+    @param filepath String. Filepath from where the data is read.
     @param url String. URL to download the dataset.
     @param read_data True or False. Defines if item is opened from directory (True) or downloaded (False).
     @param param_dct Dict. Additional information for download functions (e.g. engine, sheet_name, header...)
@@ -149,18 +157,22 @@ def get_file(filepath='', url='', read_data=dd.defaultDict['read_data'], param_d
     param_dict_csv = {"sep": ',', "header": 0, "encoding": None, 'dtype': None}
     param_dict_zip = {}
 
-    filetype_dict = {'text': pd.read_csv, 'Composite Document File V2 Document': pd.read_excel,
-                     'Excel': pd.read_excel, 'Zip': extract_zip}
-    param_dict_dict = {pd.read_csv: param_dict_csv,
-                       pd.read_excel: param_dict_excel, extract_zip: param_dict_zip}
+    filetype_dict = {
+        'text': pd.read_csv,
+        'Composite Document File V2 Document': pd.read_excel,
+        'Excel': pd.read_excel, 'Zip': extract_zip}
+    param_dict_dict = {
+        pd.read_csv: param_dict_csv, pd.read_excel: param_dict_excel,
+        extract_zip: param_dict_zip}
 
     if read_data:
         try:
             df = pd.read_json(filepath)
         except FileNotFoundError:
-            if interactive and user_choice("Warning: The file: " + filepath +
-                                           " does not exist in the directory. Do you want to download "
-                                           "the file from " + url + " instead?\n"):
+            if interactive and user_choice(
+                "Warning: The file: " + filepath +
+                " does not exist in the directory. Do you want to download "
+                    "the file from " + url + " instead?\n"):
                 df = get_file(filepath=filepath, url=url,
                               read_data=False, param_dict={})
             else:
@@ -173,14 +185,16 @@ def get_file(filepath='', url='', read_data=dd.defaultDict['read_data'], param_d
             try:  # to download file from url and show download progress
                 with progress_indicator.Percentage(message="Downloading " + url) as p:
                     file = download_file(
-                        url, 1024, None, p.set_progress, interactive=interactive)
+                        url, 1024, None, p.set_progress,
+                        verify="interactive" if interactive else True)
                     # read first 2048 bytes to find file type
                     ftype = magic.from_buffer(file.read(2048))
                     # set pointer back to starting position
                     file.seek(0)
                     # find file type in dict and use function to read
-                    func_to_use = [val for key,
-                                   val in filetype_dict.items() if key in ftype]
+                    func_to_use = [
+                        val for key, val in filetype_dict.items()
+                        if key in ftype]
                     # use different default dict for different functions
                     dict_to_use = param_dict_dict[func_to_use[0]]
                     # adjust dict
@@ -330,7 +344,9 @@ def cli(what):
     return vars(args)
 
 
-def append_filename(filename='', impute_dates=False, moving_average=0, split_berlin=False, rep_date=False):
+def append_filename(
+        filename='', impute_dates=False, moving_average=0, split_berlin=False,
+        rep_date=False):
     """! Creates consistent file names for all output.
     """
     # split_berlin and repdate especially for case data