Skip to content

Commit 1d64b69

Browse files
committed
A lot of changes. All pushing.
1 parent c15fe4d commit 1d64b69

21 files changed

+452
-16
lines changed

.gitignore

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6,3 +6,15 @@ ignore/*
66
*.R
77

88
helpers/dumps/
9+
10+
.vscode/settings.json
11+
12+
helpers/dumps2021-06-07/
13+
14+
helpers/figshareUpload/lib/__pycache__/
15+
16+
helpers/figshareUpload/settings.yaml
17+
18+
helpers/settings.yaml
19+
20+
fixGeorge.sh

bash/newSteward.sh

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,10 @@ display_help() {
1818
echo " -t taxonomyexpert Is the steward a taxonomy expert? [true|false]"
1919
echo " -d database Which database is the steward associate with?"
2020
echo
21+
echo " The script assumes that you have a ~/.pgpass file that contains your password"
22+
echo " information. The file is described in detail on the Postgres documentation:"
23+
echo " https://www.postgresql.org/docs/current/libpq-pgpass.html"
24+
echo
2125
# echo some stuff here for the -a or --add-options
2226
exit 1
2327
}

function/da/geopoliticalunits.sql

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
-- Denormalized lookup of all geopolitical units that are attached to at
-- least one site, joined to their name/rank/parent from ndb.geopoliticalunits.
CREATE MATERIALIZED VIEW da.geopoliticalunits AS
  SELECT DISTINCT sgp.geopoliticalid,
         gpu.geopoliticalname,
         gpu.rank,
         gpu.highergeopoliticalid
  FROM ndb.sitegeopolitical AS sgp
    JOIN ndb.geopoliticalunits AS gpu ON gpu.geopoliticalid = sgp.geopoliticalid
  ORDER BY gpu.geopoliticalname;

-- BUG FIX: REFRESH MATERIALIZED VIEW CONCURRENTLY (used by the trigger
-- function below) requires at least one UNIQUE index on the materialized
-- view; without it every refresh errors out.  geopoliticalid is unique here
-- because the other selected columns are attributes of the same gpu row.
CREATE UNIQUE INDEX geopol_id_uidx ON da.geopoliticalunits (geopoliticalid);

-- Hash index: rank is only ever tested for equality.
CREATE INDEX geopolrank ON da.geopoliticalunits USING hash(rank);

-- Statement-level trigger function: rebuild the view whenever the
-- underlying site/geopolitical link table changes.  CONCURRENTLY avoids
-- locking readers during the refresh.
CREATE OR REPLACE FUNCTION da.refresh_sitegeopol()
RETURNS TRIGGER LANGUAGE plpgsql
AS $$
BEGIN
  REFRESH MATERIALIZED VIEW CONCURRENTLY da.geopoliticalunits;
  RETURN NULL;  -- AFTER ... FOR EACH STATEMENT triggers ignore the result
END $$;

CREATE TRIGGER da_geopol_trigger
AFTER INSERT OR UPDATE OR DELETE OR TRUNCATE
ON ndb.sitegeopolitical
FOR EACH STATEMENT
EXECUTE PROCEDURE da.refresh_sitegeopol();

function/doi/02_ndbdata.sql

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -58,8 +58,8 @@ WITH dssamples AS (
5858
)
5959
SELECT
6060
ds.datasetid,
61-
jsonb_build_object('dataset', dsinfo.dataset,
62-
'samples', json_agg(dss.sampledata)) AS data
61+
dsinfo.dataset,
62+
jsonb_build_object('samples', json_agg(dss.sampledata)) AS data
6363
FROM
6464
ndb.datasets AS ds
6565
JOIN dssamples AS dss ON ds.datasetid = dss.datasetid

function/indexes/addingIndices.sql

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,3 +18,11 @@ CREATE INDEX IF NOT EXISTS smpageyoung_idx ON ndb.sampleages USING btree(ageyoun
1818
-- Age lookups on geochronologic determinations.
CREATE INDEX IF NOT EXISTS geoage_idx ON ndb.geochronology USING btree(age);

-- Composite index for variable lookups by taxon/element/units.
CREATE INDEX IF NOT EXISTS variableel ON ndb.variables USING btree(taxonid, variableelementid, variableunitsid);

-- Foreign-key style lookups from ndb.data into variables and samples.
CREATE INDEX IF NOT EXISTS data_variable_idx ON ndb.data USING btree(variableid);
CREATE INDEX IF NOT EXISTS data_sample_idx ON ndb.data USING btree(sampleid);

-- Samples filtered by taxon.
CREATE INDEX IF NOT EXISTS sample_taxon_idx ON ndb.samples USING btree(taxonid);

-- Analysis-unit joins back to collection units and facies.
CREATE INDEX IF NOT EXISTS analysisunits_collunit_idx ON ndb.analysisunits USING btree(collectionunitid);
CREATE INDEX IF NOT EXISTS analysisunits_facies_idx ON ndb.analysisunits USING btree(faciesid);
Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
import hashlib
2+
import json
3+
import requests
4+
from requests.exceptions import HTTPError
5+
import time
6+
import yaml
7+
from lib.pgBackup import backup_database
8+
import lib.figShare as fs
9+
10+
# This upload workflow is adapted from the figshare example code posted on
# StackOverflow: https://stackoverflow.com/a/39999652/14302148

token = '<insert access token here>'          # personal figshare API token
FILE_PATH = '/path/to/work/directory/cat.obj'  # local file to publish

TITLE = 'A 3D cat object model'

# Step 1: create the article shell through the figshare API.
article_id = fs.create_article(TITLE, token)

# Step 2: register the file against the article and get upload metadata.
file_info = fs.initiate_new_upload(article_id, FILE_PATH, token)

# Step 3: the figshare *upload service* API takes the file contents in parts.
fs.upload_parts(file_info=file_info, token=token, file_path=FILE_PATH)

# Step 4: back on the figshare API, mark the file upload as complete.
fs.complete_upload(article_id, file_info['id'])

helpers/figshareUpload/lib/__init__.py

Whitespace-only changes.
Lines changed: 110 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,110 @@
1+
import hashlib
2+
import json
3+
import os
4+
import requests
5+
from requests.exceptions import HTTPError
6+
7+
def raw_issue_request(method, url, token, data=None, binary=False):
    """Issue an HTTP request with figshare token authentication.

    Parameters:
        method: HTTP verb ('GET', 'POST', 'PUT', ...).
        url: full request URL.
        token: figshare personal access token, sent as an Authorization header.
        data: optional payload; JSON-encoded unless *binary* is True.
        binary: when True, *data* is sent as-is (raw bytes).

    Returns the decoded JSON body when the response is JSON, otherwise the
    raw response bytes.  Raises requests.exceptions.HTTPError on any
    non-success status (after printing the response body for debugging).
    """
    headers = {'Authorization': 'token ' + token}
    if data is not None and not binary:
        data = json.dumps(data)
    response = requests.request(method, url, headers=headers, data=data)
    try:
        response.raise_for_status()
        try:
            data = json.loads(response.content)
        except ValueError:
            # Not JSON (e.g. the upload service); hand back the raw bytes.
            data = response.content
    except HTTPError as error:
        # BUG FIX: the original passed '%s' and the error as two print
        # arguments, so the literal "%s" was printed instead of formatting.
        print('Caught an HTTPError: %s' % error)
        print('Body:\n', response.content)
        raise

    return data
24+
25+
26+
def issue_request(method, endpoint, *args, **kwargs):
    """Send a request to a figshare v2 API *endpoint* (path under the base URL).

    All extra positional/keyword arguments (token, data, binary) are passed
    straight through to raw_issue_request().
    """
    api_url = 'https://api.figshare.com/v2/{}'.format(endpoint)
    return raw_issue_request(method, api_url, *args, **kwargs)
30+
31+
32+
def create_article(title, token):
    """Create a new (private) figshare article titled *title*.

    Returns the numeric article id of the newly created article.
    """
    data = {
        'title': title  # You may add any other information about the article here as you wish.
    }
    # BUG FIX: the token was not forwarded, so raw_issue_request() raised
    # TypeError (missing positional argument 'token') on every call.
    result = issue_request('POST', 'account/articles', token, data=data)
    print('Created article:', result['location'], '\n')

    # Fetch the full article record to recover its id.
    result = raw_issue_request('GET', result['location'], token)

    return result['id']
42+
43+
44+
def list_files_of_article(article_id, token=None):
    """Print the id and name of every file attached to *article_id*.

    BUG FIX: this function never supplied a token to issue_request(), which
    made every call raise TypeError.  *token* is added as a new trailing
    parameter (default None keeps the old signature importable, but a real
    token is required for the request to succeed).
    """
    result = issue_request('GET', 'account/articles/{}/files'.format(article_id), token)
    print('Listing files for article {}:'.format(article_id))
    if result:
        for item in result:
            print('  {id} - {name}'.format(**item))
    else:
        print('  No files.')

    # BUG FIX: a bare `print` is a Python 2 leftover -- in Python 3 it is
    # just a reference to the function and prints nothing.
    print()
54+
55+
56+
def get_file_check_data(file_name):
    """Return (md5 hexdigest, size in bytes) of the file at *file_name*.

    The file is read in 1 MiB chunks so arbitrarily large files can be
    hashed without loading them fully into memory.
    """
    chunk_bytes = 1048576
    digest = hashlib.md5()
    total_size = 0
    with open(file_name, 'rb') as handle:
        for chunk in iter(lambda: handle.read(chunk_bytes), b''):
            total_size += len(chunk)
            digest.update(chunk)
    return digest.hexdigest(), total_size
67+
68+
69+
def initiate_new_upload(article_id, file_name, token):
    """Register *file_name* against article *article_id* on figshare.

    Posts the file's name, md5 and size, then fetches and returns the full
    file-info record (including the upload-service URL used by
    upload_parts()).
    """
    endpoint = 'account/articles/{}/files'
    endpoint = endpoint.format(article_id)

    md5, size = get_file_check_data(file_name)
    data = {'name': os.path.basename(file_name),
            'md5': md5,
            'size': size}

    # BUG FIX: the token was not forwarded to issue_request(), so
    # raw_issue_request() raised TypeError on every call.
    result = issue_request('POST', endpoint, token, data=data)
    print('Initiated file upload:', result['location'], '\n')

    result = raw_issue_request('GET', result['location'], token)

    return result
84+
85+
86+
def complete_upload(article_id, file_id, token=None):
    """Mark the upload of *file_id* on article *article_id* as complete.

    BUG FIX: the original forwarded no token, so issue_request() raised
    TypeError.  *token* is added as a new trailing parameter (default None
    keeps existing two-argument callers syntactically valid, but a real
    token is required for the request to succeed).
    """
    issue_request('POST', 'account/articles/{}/files/{}'.format(article_id, file_id), token)
88+
89+
90+
def upload_parts(file_info, token, file_path):
    """Stream *file_path* to the figshare upload service in parts.

    Fetches the part layout from the upload URL in *file_info*, then uploads
    each part in turn via upload_part().
    """
    url = '{upload_url}'.format(**file_info)
    result = raw_issue_request('GET', url, token)

    print('Uploading parts:')
    with open(file_path, 'rb') as fin:
        for part in result['parts']:
            upload_part(file_info, fin, part, token)
    # BUG FIX: a bare `print` is a Python 2 leftover -- in Python 3 it is
    # just a reference to the function and prints nothing.
    print()
99+
100+
101+
def upload_part(file_info, stream, part, token):
    """Upload a single *part* of an open file *stream* to the upload service.

    *part* carries partNo plus the inclusive startOffset/endOffset byte range
    to send; the target URL is built from the upload_url in *file_info*.
    """
    part_meta = dict(file_info)
    part_meta.update(part)
    url = '{upload_url}/{partNo}'.format(**part_meta)

    start = part['startOffset']
    stream.seek(start)
    chunk = stream.read(part['endOffset'] - start + 1)  # offsets are inclusive

    raw_issue_request('PUT', url, token, data=chunk, binary=True)
    print(' Uploaded part {partNo} from {startOffset} to {endOffset}'.format(**part))
Lines changed: 32 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,32 @@
1+
import time
2+
import yaml
3+
import os
4+
5+
def create_essentials():
    """Read settings.yaml and build the common pg_dump connection arguments.

    Returns a 3-tuple:
        command_str: "<host> -p <port> -d <dbname> -U <user>" fragment
                     appended after "pg_dump -h " by backup_database().
        backup_path: directory where the dump file should be written.
        filename:    date-stamped dump name, "<base>-YYYYMMDD.backup".

    Expects settings.yaml (in the working directory) to define db_name,
    db_user, db_host, db_port, backup_path and filename.
    """
    # BUG FIX: the settings file handle was opened inline and never closed;
    # use a context manager so it is released deterministically.
    with open("settings.yaml", "r") as settings_file:
        settings = yaml.load(settings_file, yaml.SafeLoader)

    db_name = settings["db_name"]
    db_user = settings["db_user"]
    db_host = settings["db_host"]
    db_port = settings["db_port"]
    backup_path = settings["backup_path"]

    # Date-stamp the dump so successive backups never overwrite each other.
    filename = settings["filename"] + "-" + time.strftime("%Y%m%d") + ".backup"

    command_str = str(db_host) + " -p " + str(db_port) + " -d " + db_name + " -U " + db_user
    return command_str, backup_path, filename
16+
17+
18+
def backup_database(table_names=None):
    """Dump the configured database to <backup_path>/<filename> via pg_dump.

    Parameters:
        table_names: optional list of table names; when given, each adds a
            ``-t`` flag so only those tables are dumped.  None (default)
            dumps the whole database.

    Connection details come from settings.yaml via create_essentials();
    pg_dump obtains the password through the usual libpq mechanisms
    (e.g. ~/.pgpass).  Prints a success or failure message.
    """
    command_str, backup_path, filename = create_essentials()
    command_str = "pg_dump -h " + command_str

    if table_names is not None:
        for table in table_names:
            command_str = command_str + " -t " + table

    # -F c: custom archive format; -b: include large objects; -v: verbose.
    command_str = command_str + " -F c -b -v -f '" + backup_path + "/" + filename + "'"

    # BUG FIX: os.system() does not raise on failure -- it returns the exit
    # status -- so the previous try/except always reported "Backup completed"
    # even when pg_dump failed.  Inspect the status instead.
    # NOTE(review): the command is assembled by string concatenation; settings
    # values containing shell metacharacters would break or inject into the
    # shell -- consider subprocess.run() with an argument list.
    status = os.system(command_str)
    if status == 0:
        print("Backup completed")
    else:
        print("!!Problem occurred!!")
        print("pg_dump exited with status " + str(status))

0 commit comments

Comments
 (0)