NREL · nmerket · Mar 9, 2021 · Jan 13, 2021 · Jan 19, 2021 · Jan 25, 2021
diff --git a/aws_demo_project.yml b/aws_demo_project.yml
@@ -1,6 +1,6 @@
 schema_version: 0.2
 stock_type: residential
-buildstock_directory: ../OpenStudio-BuildStock  # Relative to this file or absolute
+buildstock_directory: ../resstock  # Relative to this file or absolute
 project_directory: project_national  # Relative to buildstock_directory
 output_directory: ../demo_test_outputs
 weather_files_url: https://data.nrel.gov/system/files/128/ResStock_TMY3.zip
@@ -36,7 +36,9 @@ aws:
     bucket: resbldg-datasets
     prefix: testing/external_demo_project
   emr:
-    slave_instance_count: 1
+    manager_instance_type: m5.xlarge
+    worker_instance_type: r5.4xlarge
+    worker_instance_count: 1
   region: us-west-2
   use_spot: true
   batch_array_size: 4

diff --git a/buildstockbatch/aws/aws.py b/buildstockbatch/aws/aws.py
@@ -1486,14 +1486,14 @@ def create_emr_cluster_function(self):
                     {
                         'Market': 'SPOT' if self.batch_use_spot else 'ON_DEMAND',
                         'InstanceRole': 'MASTER',
-                        'InstanceType': self.emr_master_instance_type,
+                        'InstanceType': self.emr_manager_instance_type,
                         'InstanceCount': 1
                     },
                     {
                         'Market': 'SPOT' if self.batch_use_spot else 'ON_DEMAND',
                         'InstanceRole': 'CORE',
-                        'InstanceType': self.emr_slave_instance_type,
-                        'InstanceCount': self.emr_slave_instance_count
+                        'InstanceType': self.emr_worker_instance_type,
+                        'InstanceCount': self.emr_worker_instance_count
                     },
                 ],
                 'Ec2SubnetId': self.priv_vpc_subnet_id_1,
@@ -1667,8 +1667,8 @@ def validate_instance_types(project_file):
         ec2 = boto3_session.client('ec2')
         job_base = AwsJobBase('genericjobid', aws_config, boto3_session)
         instance_types_requested = set()
-        instance_types_requested.add(job_base.emr_master_instance_type)
-        instance_types_requested.add(job_base.emr_slave_instance_type)
+        instance_types_requested.add(job_base.emr_manager_instance_type)
+        instance_types_requested.add(job_base.emr_worker_instance_type)
         inst_type_resp = ec2.describe_instance_type_offerings(Filters=[{
             'Name': 'instance-type',
             'Values': list(instance_types_requested)

diff --git a/buildstockbatch/aws/awsbase.py b/buildstockbatch/aws/awsbase.py
@@ -177,9 +177,9 @@ def __init__(self, job_identifier, aws_config, boto3_session):
 
         # EMR
         emr_config = aws_config.get('emr', {})
-        self.emr_master_instance_type = emr_config.get('master_instance_type', 'm5.4xlarge')
-        self.emr_slave_instance_type = emr_config.get('slave_instance_type', 'r5.4xlarge')
-        self.emr_slave_instance_count = emr_config.get('slave_instance_count', 4)
+        self.emr_manager_instance_type = emr_config.get('manager_instance_type', 'm5.4xlarge')
+        self.emr_worker_instance_type = emr_config.get('worker_instance_type', 'r5.4xlarge')
+        self.emr_worker_instance_count = emr_config.get('worker_instance_count', 4)
         self.emr_cluster_security_group_name = f'{self.job_identifier}_emr_security_group'
         self.emr_cluster_name = f'{self.job_identifier}_emr_dask_cluster'
         self.emr_job_flow_role_name = f'{self.job_identifier}_emr_job_flow_role'

diff --git a/buildstockbatch/schemas/v0.1.yaml b/buildstockbatch/schemas/v0.1.yaml
@@ -33,9 +33,9 @@ aws-job-environment:
   memory: int(min=1024, required=False)
 
 aws-emr-spec:
-  master_instance_type: str(required=False)
-  slave_instance_type: str(required=False)
-  slave_instance_count: int(min=1, required=False)
+  manager_instance_type: str(required=False)
+  worker_instance_type: str(required=False)
+  worker_instance_count: int(min=1, required=False)
   dask_worker_vcores: int(min=1, required=False)
 
 hpc-spec:

diff --git a/buildstockbatch/schemas/v0.2.yaml b/buildstockbatch/schemas/v0.2.yaml
@@ -35,9 +35,9 @@ aws-job-environment:
   memory: int(min=1024, required=False)
 
 aws-emr-spec:
-  master_instance_type: str(required=False)
-  slave_instance_type: str(required=False)
-  slave_instance_count: int(min=1, required=False)
+  manager_instance_type: str(required=False)
+  worker_instance_type: str(required=False)
+  worker_instance_count: int(min=1, required=False)
   dask_worker_vcores: int(min=1, required=False)
 
 hpc-spec:

diff --git a/docs/project_defn.rst b/docs/project_defn.rst
@@ -354,9 +354,9 @@ on the `AWS Batch <https://aws.amazon.com/batch/>`_ service.
    subscription to receive further notification emails.
 *  ``emr``: Optional key to specify options for postprocessing using an EMR cluster. Generally the defaults should work fine.
 
-    * ``master_instance_type``: The `instance type`_ to use for the EMR master node. Default: ``m5.xlarge``.
-    * ``slave_instance_type``: The `instance type`_ to use for the EMR worker nodes. Default: ``r5.4xlarge``.
-    * ``slave_instance_count``: The number of worker nodes to use. Same as ``eagle.postprocessing.n_workers``. 
+    * ``manager_instance_type``: The `instance type`_ to use for the EMR master node. Default: ``m5.xlarge``.
+    * ``worker_instance_type``: The `instance type`_ to use for the EMR worker nodes. Default: ``r5.4xlarge``.
+    * ``worker_instance_count``: The number of worker nodes to use. Same as ``eagle.postprocessing.n_workers``. 
       Increase this for a large dataset. Default: 2.
     * ``dask_worker_vcores``: The number of cores for each dask worker. Increase this if your dask workers are running out of memory. Default: 2.
 *  ``job_environment``: Specifies the computing requirements for each simulation.

diff --git a/project_resstock_national.yml b/project_resstock_national.yml
@@ -48,7 +48,7 @@ eagle:
 #     bucket: resbldg-datasets
 #     prefix: testing/user_test
 #   emr:
-#     slave_instance_count: 1
+#     worker_instance_count: 1
 #   region: us-west-2
 #   use_spot: true
 #   batch_array_size: 10