nestauk
diff --git a/‎docs/source/nesta.core.schemas.rst
Lines changed: 1 addition & 0 deletions b/‎docs/source/nesta.core.schemas.rst
Lines changed: 1 addition & 0 deletions
diff --git a/‎docs/source/nesta.core.scripts.rst
Lines changed: 0 additions & 3 deletions b/‎docs/source/nesta.core.scripts.rst
Lines changed: 0 additions & 3 deletions
diff --git a/‎nesta/core/batchables/arxiv/arxiv_elasticsearch/run.py
Lines changed: 6 additions & 10 deletions b/‎nesta/core/batchables/arxiv/arxiv_elasticsearch/run.py
Lines changed: 6 additions & 10 deletions
diff --git a/‎nesta/core/batchables/crunchbase/crunchbase_elasticsearch/run.py
Lines changed: 5 additions & 9 deletions b/‎nesta/core/batchables/crunchbase/crunchbase_elasticsearch/run.py
Lines changed: 5 additions & 9 deletions
diff --git a/‎nesta/core/batchables/eurito/arxiv_eu/run.py
Lines changed: 3 additions & 5 deletions b/‎nesta/core/batchables/eurito/arxiv_eu/run.py
Lines changed: 3 additions & 5 deletions
diff --git a/‎nesta/core/batchables/eurito/crunchbase_eu/run.py renamed to ‎nesta/core/batchables/eurito/companies_eu/run.py
Lines changed: 1 addition & 4 deletions b/‎nesta/core/batchables/eurito/crunchbase_eu/run.py renamed to ‎nesta/core/batchables/eurito/companies_eu/run.py
Lines changed: 1 addition & 4 deletions
diff --git a/‎nesta/core/batchables/eurito/cordis_eu/run.py
Lines changed: 3 additions & 5 deletions b/‎nesta/core/batchables/eurito/cordis_eu/run.py
Lines changed: 3 additions & 5 deletions
diff --git a/‎nesta/core/batchables/eurito/patstat-eu/run.py
Lines changed: 0 additions & 128 deletions b/‎nesta/core/batchables/eurito/patstat-eu/run.py
Lines changed: 0 additions & 128 deletions
diff --git a/‎nesta/core/batchables/eurito/patstat_eu/run.py
Lines changed: 1 addition & 3 deletions b/‎nesta/core/batchables/eurito/patstat_eu/run.py
Lines changed: 1 addition & 3 deletions
diff --git a/‎nesta/core/batchables/health_data/nih_abstract_mesh_data/run.py
Lines changed: 1 addition & 3 deletions b/‎nesta/core/batchables/health_data/nih_abstract_mesh_data/run.py
Lines changed: 1 addition & 3 deletions
@@ -1 +1,2 @@
 .. include:: ../../nesta/core/schemas/README.rst
+.. include:: ../../nesta/core/schemas/tier_1/mappings/README.rst
@@ -1,4 +1 @@
-Scripts
-=======
-
 .. include:: ../../nesta/core/scripts/README.rst
@@ -20,7 +20,6 @@
 from datetime import datetime as dt
 
 from nesta.core.orms.orm_utils import db_session, get_mysql_engine
-from nesta.core.orms.orm_utils import load_json_from_pathstub
 from nesta.core.orms.orm_utils import object_to_dict
 from nesta.core.orms.arxiv_orm import Article
 from nesta.core.orms.grid_orm import Institute
@@ -76,10 +75,7 @@ def run():
     ngrammer = Ngrammer(database="production")
 
     # es setup
-    strans_kwargs={'filename':'arxiv.json',
-                   'from_key':'tier_0',
-                   'to_key':'tier_1',
-                   'ignore':['id']}
+    strans_kwargs={'filename':'arxiv.json', 'ignore':['id']}
     es = ElasticsearchPlus(hosts=es_host,
                            port=es_port,
                            aws_auth_region=aws_auth_region,
@@ -164,9 +160,9 @@ def run():
             countries = set(grid_countries[inst_id]
                             for inst_id in good_institutes
                             if inst_id in grid_countries)
-            row['categories'], _, _ = hierarchy_field(cats)
-            row['fos'], _, _ = hierarchy_field(fos)
-            row['countries'], _, _ = hierarchy_field(countries)
+            row['nested_categories'], _, _ = hierarchy_field(cats)
+            row['fields_of_study'], _, _ = hierarchy_field(fos)
+            row['nested_location'], _, _ = hierarchy_field(countries)
 
             # Pull out international institute info
             has_mn = any(is_multinational(inst,
@@ -216,8 +212,8 @@ def run():
 
     if 'BATCHPAR_outinfo' not in os.environ:
         from nesta.core.orms.orm_utils import setup_es
-        es, es_config = setup_es('dev', True, True,
-                                 dataset='arxiv')
+        es, es_config = setup_es(endpoint='arxlive', dataset='arxiv',
+                                 production=False, drop_and_recreate=True)                                 
         environ = {'batch_file': ('ArxivESTask-2019-09-19-'
                                   'False-1568888970724721.json'),
                    'config': ('/home/ec2-user/nesta-eu/nesta/'
 
@@ -58,12 +58,8 @@ def run():
     continent_lookup[None] = None
 
     # es setup
-    field_null_mapping = load_json_from_pathstub("tier_1/field_null_mappings/",
-                                                 "health_scanner.json")
-    strans_kwargs={'filename':'crunchbase_organisation_members.json',
-                   'from_key':'tier_0',
-                   'to_key':'tier_1',
-                   'ignore':['id']}
+    field_null_mapping = load_json_from_pathstub("health-scanner", "nulls.json")
+    strans_kwargs = {'filename': 'companies.json', 'ignore': ['id']}
     es = ElasticsearchPlus(hosts=es_host,
                            port=es_port,
                            aws_auth_region=aws_auth_region,
@@ -162,9 +158,9 @@ def run():
 
     if 'BATCHPAR_outinfo' not in os.environ:
         from nesta.core.orms.orm_utils import setup_es
-        es, es_config = setup_es('dev', True, True,
-                                 dataset='crunchbase',
-                                 aliases='health_scanner')
+        es, es_config = setup_es(production=False, endpoint='health-scanner',
+                                 dataset='companies',
+                                 drop_and_recreate=True)
 
         environ = {"AWSBATCHTEST": "",
                    'BATCHPAR_batch_file': 'crunchbase_to_es-15597291977144725.json', 
 
@@ -54,9 +54,7 @@ def run():
 
     # es setup
     logging.info('Connecting to ES')
-    strans_kwargs={'filename':'eurito/arxiv-eu.json',
-                   'from_key':'tier_0', 'to_key':'tier_1',
-                   'ignore':['id']}
+    strans_kwargs = {'filename': 'arxiv.json', 'ignore': ['id']}
     es = ElasticsearchPlus(hosts=es_host,
                            port=es_port,
                            aws_auth_region=aws_auth_region,
@@ -202,8 +200,8 @@ def run():
     set_log_level()
     if 'BATCHPAR_outinfo' not in os.environ:
         from nesta.core.orms.orm_utils import setup_es
-        es, es_config = setup_es('dev', True, True,
-                                 dataset='arxiv-eu')
+        es, es_config = setup_es(production=False, endpoint='eurito', 
+                                 dataset='arxiv', drop_and_recreate=True)
         environ = {'config': ('/home/ec2-user/nesta-eu/nesta/'
                               'core/config/mysqldb.config'),
                    'batch_file' : ('arxiv-eu_EURITO-ElasticsearchTask-'
 
@@ -61,10 +61,7 @@ def run():
     eu_countries = get_eu_countries()
 
     # es setup
-    strans_kwargs={'filename':'eurito/crunchbase-eu.json',
-                   'from_key':'tier_0',
-                   'to_key':'tier_1',
-                   'ignore':['id']}
+    strans_kwargs = {'filename': 'companies.json', 'ignore': ['id']}
     es = ElasticsearchPlus(hosts=es_host,
                            port=es_port,
                            aws_auth_region=aws_auth_region,
 
@@ -88,9 +88,7 @@ def run():
 
     # es setup
     logging.info('Connecting to ES')
-    strans_kwargs={'filename':'eurito/cordis-eu.json',
-                   'from_key':'tier_0', 'to_key':'tier_1',
-                   'ignore':['id']}
+    strans_kwargs = {'filename': 'cordis.json', 'ignore': ['id']}
     es = ElasticsearchPlus(hosts=es_host,
                            port=es_port,
                            aws_auth_region=aws_auth_region,
@@ -132,8 +130,8 @@ def run():
     if 'BATCHPAR_outinfo' not in os.environ:
         from nesta.core.orms.orm_utils import setup_es
         from nesta.core.luigihacks.misctools import find_filepath_from_pathstub
-        es, es_config = setup_es('dev', True, True,
-                                 dataset='cordis-eu')
+        es, es_config = setup_es(production=False, endpoint='eurito', 
+                                 dataset='cordis', drop_and_recreate=True)
         environ = {'config': find_filepath_from_pathstub('mysqldb.config'),
                    'batch_file' : ('cordis-eu_EURITO-ElasticsearchTask-'
                                    '2020-04-10-True-15865345336407135.json'),
 
@@ -63,9 +63,7 @@ def run():
 
     # es setup
     logging.info('Connecting to ES')
-    strans_kwargs={'filename':'eurito/patstat-eu.json',
-                   'from_key':'tier_0', 'to_key':'tier_1',
-                   'ignore':['id']}
+    strans_kwargs = {'filename': 'patstat.json', 'ignore': ['id']}
     es = ElasticsearchPlus(hosts=es_host,
                            port=es_port,
                            aws_auth_region=aws_auth_region,
 
@@ -68,9 +68,7 @@ def run():
     dupes = format_duplicate_map(dupes)
 
     # Set up elastic search connection
-    field_null_mapping = load_json_from_pathstub("tier_1/"
-                                                 "field_null_mappings/",
-                                                 "health_scanner.json")
+    field_null_mapping = load_json_from_pathstub("health-scanner", "nulls.json")
     es = ElasticsearchPlus(hosts=es_config['host'],
                            port=es_config['port'],
                            aws_auth_region=es_config['region'],
Original file line number	Diff line number	Diff line change
`@@ -1 +1,2 @@`
`1`	`1`	`.. include:: ../../nesta/core/schemas/README.rst`
	`2`	`+.. include:: ../../nesta/core/schemas/tier_1/mappings/README.rst`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1 @@`
`1`		`-Scripts`
`2`		`-=======`
`3`		`-`
`4`	`1`	`.. include:: ../../nesta/core/scripts/README.rst`