diff --git a/docs/dataartsstudio/umn/ALL_META.TXT.json b/docs/dataartsstudio/umn/ALL_META.TXT.json index b20a64fe8..cae8f523a 100644 --- a/docs/dataartsstudio/umn/ALL_META.TXT.json +++ b/docs/dataartsstudio/umn/ALL_META.TXT.json @@ -31,13 +31,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"What Is DataArts Studio?", @@ -54,13 +54,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Basic Concepts", @@ -77,13 +77,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Functions", @@ -100,13 +100,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Advantages", @@ -123,13 +123,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Application Scenarios", @@ -146,13 +146,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Permission Management", @@ -169,13 +169,13 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Permissions", @@ -186,19 +186,19 @@ "node_id":"dataartsstudio_07_006.xml", "product_code":"dataartsstudio", "code":"9", - "des":"The following table lists the recommended browser for logging in to DataArts Studio.Browser compatibilityBrowserRecommended VersionRecommended OSRemarksGoogle Chrome115, ", + "des":"The following table lists the recommended browser for logging in to DataArts Studio.Browser compatibilityBrowserRecommended VersionRecommended OSRemarksGoogle Chrome133, ", "doc_type":"usermanual", "kw":"Notes and Constraints,Service Overview,User Guide", "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Notes and Constraints", @@ -215,314 +215,23 @@ "search_title":"", "metedata":[ { + "prodname":"dataartsstudio", "opensource":"false;true", "isMulti":"no", "IsMulti":"No", "documenttype":"usermanual", - "IsBot":"yes", "isBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes" } ], "title":"Related Services", "githuburl":"" }, - { - "uri":"dataartsstudio_12_0002.html", - "node_id":"dataartsstudio_12_0002.xml", - "product_code":"dataartsstudio", - "code":"11", - "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "doc_type":"usermanual", - "kw":"Preparations", - "search_title":"", - "metedata":[ - { - "prodname":"dataartsstudio", - "documenttype":"usermanual" - } - ], - "title":"Preparations", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0003.html", - "node_id":"dataartsstudio_01_0003.xml", - "product_code":"dataartsstudio", - "code":"12", - "des":"Before using DataArts Studio, you need to create a a cloud platform account, create a DataArts Studio instance, access the DataArts Studio instance console, manage worksp", - "doc_type":"usermanual", - "kw":"Preparations,Preparations,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Preparations", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_1028.html", - "node_id":"dataartsstudio_01_1028.xml", - "product_code":"dataartsstudio", - "code":"13", - "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "doc_type":"usermanual", - "kw":"Creating DataArts Studio Instances", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Creating DataArts Studio Instances", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0115.html", - "node_id":"dataartsstudio_01_0115.xml", - "product_code":"dataartsstudio", - "code":"14", - "des":"Only users who have the DARTS Administrator or Tenant Administrator permissions can create DataArts Studio instances or DataArts Studio incremental packages. To allow use", - "doc_type":"usermanual", - "kw":"Creating a DataArts Studio Basic Package,Creating DataArts Studio Instances,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Creating a DataArts Studio Basic Package", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0119.html", - "node_id":"dataartsstudio_01_0119.xml", - "product_code":"dataartsstudio", - "code":"15", - "des":"DataArts Studio provides basic and incremental packages. If the basic package cannot meet your requirements, you can create an incremental package. Before you create an i", - "doc_type":"usermanual", - "kw":"(Optional) Creating a DataArts Studio Incremental Package,Creating DataArts Studio Instances,User Gu", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"(Optional) Creating a DataArts Studio Incremental Package", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0001.html", - "node_id":"dataartsstudio_01_0001.xml", - "product_code":"dataartsstudio", - "code":"16", - "des":"A DataArts Studio instance has been obtained. For details, see Creating a DataArts Studio Basic Package.If there are multiple DataArts Studio instances in the current reg", - "doc_type":"usermanual", - "kw":"Accessing the DataArts Studio Instance Console,Preparations,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Accessing the DataArts Studio Instance Console", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0011.html", - "node_id":"dataartsstudio_01_0011.xml", - "product_code":"dataartsstudio", - "code":"17", - "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "doc_type":"usermanual", - "kw":"Managing a Workspace", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Managing a Workspace", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0116.html", - "node_id":"dataartsstudio_01_0116.xml", - "product_code":"dataartsstudio", - "code":"18", - "des":"The system will create a default workspace and assign the admin role to you after you create a DataArts Studio instance. can use the default workspace or create a new wor", - "doc_type":"usermanual", - "kw":"Creating and Managing a Workspace,Managing a Workspace,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Creating and Managing a Workspace", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0530.html", - "node_id":"dataartsstudio_01_0530.xml", - "product_code":"dataartsstudio", - "code":"19", - "des":"By default, job logs and DLI dirty data are stored in an OBS bucket named dlf-log-{project ID}. You can customize a log storage path. You can configure an OBS bucket glob", - "doc_type":"usermanual", - "kw":"(Optional) Changing the Job Log Storage Path,Managing a Workspace,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"(Optional) Changing the Job Log Storage Path", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0118.html", - "node_id":"dataartsstudio_01_0118.xml", - "product_code":"dataartsstudio", - "code":"20", - "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "doc_type":"usermanual", - "kw":"Authorizing Users to Use DataArts Studio", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Authorizing Users to Use DataArts Studio", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0004.html", - "node_id":"dataartsstudio_01_0004.xml", - "product_code":"dataartsstudio", - "code":"21", - "des":"Identity and Access Management (IAM) can be used for fine-grained permissions management on your DataArts Studio resources. With IAM, you can:Create IAM users for employe", - "doc_type":"usermanual", - "kw":"Creating an IAM User and Assigning DataArts Studio Permissions,Authorizing Users to Use DataArts Stu", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Creating an IAM User and Assigning DataArts Studio Permissions", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0120.html", - "node_id":"dataartsstudio_01_0120.xml", - "product_code":"dataartsstudio", - "code":"22", - "des":"For IAM users with the DARTS User permission, a workspace role determines their permissions in the workspace. Currently, five preset roles are available: admin, developer", - "doc_type":"usermanual", - "kw":"(Optional) Defining a Workspace Role,Authorizing Users to Use DataArts Studio,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"(Optional) Defining a Workspace Role", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0117.html", - "node_id":"dataartsstudio_01_0117.xml", - "product_code":"dataartsstudio", - "code":"23", - "des":"For IAM users with the DARTS User permission, a workspace role determines their permissions in the workspace. If you want to allow another IAM user with the DARTS User pe", - "doc_type":"usermanual", - "kw":"Adding a Member and Assigning a Role,Authorizing Users to Use DataArts Studio,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"Adding a Member and Assigning a Role", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0006.html", - "node_id":"dataartsstudio_01_0006.xml", - "product_code":"dataartsstudio", - "code":"24", - "des":"When using DataArts Studio, for example, when creating OBS links, calling APIs, or locating issues, you may need to obtain information such as access keys, project IDs, a", - "doc_type":"usermanual", - "kw":"(Optional) Obtaining Authentication Information,Preparations,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsMulti":"No", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"(Optional) Obtaining Authentication Information", - "githuburl":"" - }, { "uri":"dataartsstudio_12_0004.html", "node_id":"dataartsstudio_12_0004.xml", "product_code":"dataartsstudio", - "code":"25", + "code":"11", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"User Guide", @@ -537,123 +246,270 @@ "githuburl":"" }, { - "uri":"en-us_topic_0000002270846046.html", - "node_id":"en-us_topic_0000002270846046.xml", + "uri":"dataartsstudio_01_1028.html", + "node_id":"dataartsstudio_01_1028.xml", "product_code":"dataartsstudio", - "code":"26", + "code":"12", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Management Console", + "kw":"Creating and Configuring a DataArts Studio Instance", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Management Console", + "title":"Creating and Configuring a DataArts Studio Instance", "githuburl":"" }, { - "uri":"en-us_topic_0000002270788944.html", - "node_id":"en-us_topic_0000002270788944.xml", + "uri":"dataartsstudio_01_0115.html", + "node_id":"dataartsstudio_01_0115.xml", "product_code":"dataartsstudio", - "code":"27", - "des":"A tag is a key-value pair that identifies an instance. It consists of a key and a value.DataArts Studio instance tags can be used in the following scenarios:If there are ", + "code":"13", + "des":"Only users with DARTSAdministrator or Tenant Administrator permissions can create DataArts Studio instances or incremental packages.Users with Tenant Administrator permis", "doc_type":"usermanual", - "kw":"Tags,Management Console,User Guide", + "kw":"Creating a DataArts Studio Instance,Creating and Configuring a DataArts Studio Instance,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Tags", + "title":"Creating a DataArts Studio Instance", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0138.html", + "node_id":"dataartsstudio_01_0138.xml", + "product_code":"dataartsstudio", + "code":"14", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Creating a DataArts Studio Incremental Package", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating a DataArts Studio Incremental Package", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0139.html", + "node_id":"dataartsstudio_01_0139.xml", + "product_code":"dataartsstudio", + "code":"15", + "des":"DataArts Studio provides basic and incremental packages. If the basic package cannot meet your demands, you need to create an incremental package.Table 1 lists the increm", + "doc_type":"usermanual", + "kw":"Introduction to Incremental Packages,Creating a DataArts Studio Incremental Package,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Introduction to Incremental Packages", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0119.html", + "node_id":"dataartsstudio_01_0119.xml", + "product_code":"dataartsstudio", + "code":"16", + "des":"A DataArts Migration (that is, CDM) incremental package provides resources for a CDM cluster. When you create a CDM incremental package, the system automatically creates ", + "doc_type":"usermanual", + "kw":"Creating a DataArts Migration Incremental Package,Creating a DataArts Studio Incremental Package,Use", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating a DataArts Migration Incremental Package", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0145.html", + "node_id":"dataartsstudio_01_0145.xml", + "product_code":"dataartsstudio", + "code":"17", + "des":"This type of incremental package provides resource groups for real-time jobs in DataArts Migration. DataArts Migration resource groups can be used to migrate data to the ", + "doc_type":"usermanual", + "kw":"Creating a DataArts Migration Resource Group Incremental Package,Creating a DataArts Studio Incremen", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating a DataArts Migration Resource Group Incremental Package", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0001.html", + "node_id":"dataartsstudio_01_0001.xml", + "product_code":"dataartsstudio", + "code":"18", + "des":"You have obtained a DataArts Studio instance. For details, see Creating a DataArts Studio Instance.If there are multiple DataArts Studio instances in the current region, ", + "doc_type":"usermanual", + "kw":"Accessing the DataArts Studio Instance Console,Creating and Configuring a DataArts Studio Instance,U", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Accessing the DataArts Studio Instance Console", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0134.html", + "node_id":"dataartsstudio_01_0134.xml", + "product_code":"dataartsstudio", + "code":"19", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Creating and Configuring a Workspace in Simple Mode", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating and Configuring a Workspace in Simple Mode", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0116.html", + "node_id":"dataartsstudio_01_0116.xml", + "product_code":"dataartsstudio", + "code":"20", + "des":"The system creates a default workspace named default for the DataArts Studio instance you create and assigns administrator permissions to you. You can use the default wor", + "doc_type":"usermanual", + "kw":"Creating a Workspace in Simple Mode,Creating and Configuring a Workspace in Simple Mode,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating a Workspace in Simple Mode", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0530.html", + "node_id":"dataartsstudio_01_0530.xml", + "product_code":"dataartsstudio", + "code":"21", + "des":"By default, job logs and DLI dirty data are stored in an OBS bucket named dlf-log-{project ID}. You can customize a storage path for logs and one for DLI dirty data. You ", + "doc_type":"usermanual", + "kw":"(Optional) Changing the Job Log Storage Path,Creating and Configuring a Workspace in Simple Mode,Use", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"(Optional) Changing the Job Log Storage Path", "githuburl":"" }, { "uri":"dataartsstudio_01_5098.html", "node_id":"dataartsstudio_01_5098.xml", "product_code":"dataartsstudio", - "code":"28", + "code":"22", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Enterprise Mode", + "kw":"(Optional) Creating and Using a Workspace in Enterprise Mode", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Enterprise Mode", + "title":"(Optional) Creating and Using a Workspace in Enterprise Mode", "githuburl":"" }, { "uri":"dataartsstudio_01_5099.html", "node_id":"dataartsstudio_01_5099.xml", "product_code":"dataartsstudio", - "code":"29", + "code":"23", "des":"DataArts Studio provides two workspace modes, the simplified mode and enterprise mode, to help you manage your production data with varied security control requirements. ", "doc_type":"usermanual", - "kw":"DataArts Studio Enterprise Mode Overview,Enterprise Mode,User Guide", + "kw":"Introduction to the Enterprise Mode,(Optional) Creating and Using a Workspace in Enterprise Mode,Use", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"DataArts Studio Enterprise Mode Overview", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_5100.html", - "node_id":"dataartsstudio_01_5100.xml", - "product_code":"dataartsstudio", - "code":"30", - "des":"The DataArts Studio enterprise mode mainly involves the Management Center and DataArts Factory components. The service process is completed by the admin, developer, deplo", - "doc_type":"usermanual", - "kw":"Service Process in Enterprise Mode,Enterprise Mode,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Service Process in Enterprise Mode", + "title":"Introduction to the Enterprise Mode", "githuburl":"" }, { "uri":"dataartsstudio_01_5135.html", "node_id":"dataartsstudio_01_5135.xml", "product_code":"dataartsstudio", - "code":"31", + "code":"24", "des":"If you are using a workspace in simple mode and want to isolate the development and production environments, you can upgrade the workspace to one in enterprise mode. If y", "doc_type":"usermanual", - "kw":"Creating a Workspace in Enterprise Mode,Enterprise Mode,User Guide", + "kw":"Creating a Workspace in Enterprise Mode,(Optional) Creating and Using a Workspace in Enterprise Mode", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -663,18 +519,60 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_5101.html", - "node_id":"dataartsstudio_01_5101.xml", + "uri":"dataartsstudio_01_5106.html", + "node_id":"dataartsstudio_01_5106.xml", "product_code":"dataartsstudio", - "code":"32", - "des":"As the project owner or development owner, the admin manages the environment configuration and personnel roles in enterprise mode in a unified manner. The following table", + "code":"25", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Admin Operations,Enterprise Mode,User Guide", + "kw":"Operations Supported for Different Roles in Enterprise Mode", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Operations Supported for Different Roles in Enterprise Mode", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_5100.html", + "node_id":"dataartsstudio_01_5100.xml", + "product_code":"dataartsstudio", + "code":"26", + "des":"The DataArts Studio enterprise mode mainly involves the Management Center and DataArts Factory components. The service process is completed by the admin, developer, deplo", + "doc_type":"usermanual", + "kw":"Service Process in Enterprise Mode,Operations Supported for Different Roles in Enterprise Mode,User ", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Service Process in Enterprise Mode", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_5101.html", + "node_id":"dataartsstudio_01_5101.xml", + "product_code":"dataartsstudio", + "code":"27", + "des":"As the project owner or development owner, the admin manages the environment configuration and personnel roles in enterprise mode in a unified manner. The following table", + "doc_type":"usermanual", + "kw":"Admin Operations,Operations Supported for Different Roles in Enterprise Mode,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -687,15 +585,15 @@ "uri":"dataartsstudio_01_5102.html", "node_id":"dataartsstudio_01_5102.xml", "product_code":"dataartsstudio", - "code":"33", + "code":"28", "des":"The developer develops scripts and jobs. The following table describes related operations.", "doc_type":"usermanual", - "kw":"Developer Operations,Enterprise Mode,User Guide", + "kw":"Developer Operations,Operations Supported for Different Roles in Enterprise Mode,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -708,15 +606,15 @@ "uri":"dataartsstudio_01_5103.html", "node_id":"dataartsstudio_01_5103.xml", "product_code":"dataartsstudio", - "code":"34", + "code":"29", "des":"The deployer reviews the tasks to be released. This section describes related operations.The deployer reviews the release tasks submitted by the developer. Modified jobs ", "doc_type":"usermanual", - "kw":"Deployer Operations,Enterprise Mode,User Guide", + "kw":"Deployer Operations,Operations Supported for Different Roles in Enterprise Mode,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -729,15 +627,15 @@ "uri":"dataartsstudio_01_5104.html", "node_id":"dataartsstudio_01_5104.xml", "product_code":"dataartsstudio", - "code":"35", + "code":"30", "des":"The operator manages the jobs, instances, notifications, and backups in the production environment in a unified manner. The following table describes related operations.", "doc_type":"usermanual", - "kw":"Operator Operations,Enterprise Mode,User Guide", + "kw":"Operator Operations,Operations Supported for Different Roles in Enterprise Mode,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -746,11 +644,137 @@ "title":"Operator Operations", "githuburl":"" }, + { + "uri":"dataartsstudio_01_4105.html", + "node_id":"dataartsstudio_01_4105.xml", + "product_code":"dataartsstudio", + "code":"31", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Managing DataArts Studio Resources", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Managing DataArts Studio Resources", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_7587.html", + "node_id":"dataartsstudio_01_7587.xml", + "product_code":"dataartsstudio", + "code":"32", + "des":"Before creating a real-time data migration job, you need to associate the data migration resource group with a DataArts Studio workspace so that you can select a specifie", + "doc_type":"usermanual", + "kw":"Associating a Real-Time Migration Resource Group with Workspaces,Managing DataArts Studio Resources,", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Associating a Real-Time Migration Resource Group with Workspaces", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0118.html", + "node_id":"dataartsstudio_01_0118.xml", + "product_code":"dataartsstudio", + "code":"33", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Authorizing Users to Use DataArts Studio", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Authorizing Users to Use DataArts Studio", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0004.html", + "node_id":"dataartsstudio_01_0004.xml", + "product_code":"dataartsstudio", + "code":"34", + "des":"Identity and Access Management (IAM) can be used for fine-grained permissions management on your DataArts Studio resources. With IAM, you can:Create IAM users for employe", + "doc_type":"usermanual", + "kw":"Creating an IAM User and Assigning DataArts Studio Permissions,Authorizing Users to Use DataArts Stu", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating an IAM User and Assigning DataArts Studio Permissions", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0107.html", + "node_id":"dataartsstudio_01_0107.xml", + "product_code":"dataartsstudio", + "code":"35", + "des":"For IAM users with DARTS User account permissions, DataArts Studio workspace roles determine their permissions in workspaces. Preset roles include admin, developer, deplo", + "doc_type":"usermanual", + "kw":"(Optional) Defining a Workspace Role,Authorizing Users to Use DataArts Studio,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"(Optional) Defining a Workspace Role", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0117.html", + "node_id":"dataartsstudio_01_0117.xml", + "product_code":"dataartsstudio", + "code":"36", + "des":"For IAM users with DARTS User account permissions, their permissions in a DataArts Studio workspace are determined by workspace roles. If you want to share a DataArts Stu", + "doc_type":"usermanual", + "kw":"Adding Workspace Members and Assigning Roles,Authorizing Users to Use DataArts Studio,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Adding Workspace Members and Assigning Roles", + "githuburl":"" + }, { "uri":"dataartsstudio_01_0008.html", "node_id":"dataartsstudio_01_0008.xml", "product_code":"dataartsstudio", - "code":"36", + "code":"37", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Management Center", @@ -758,7 +782,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -768,45 +792,24 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0005_0.html", - "node_id":"dataartsstudio_01_0005_0.xml", - "product_code":"dataartsstudio", - "code":"37", - "des":"Before using DataArts Studio, you need to select cloud services or databases as the data lake foundation, which provides storage and compute capabilities. DataArts Studio", - "doc_type":"usermanual", - "kw":"Data Sources,Management Center,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Data Sources", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0009.html", - "node_id":"dataartsstudio_01_0009.xml", + "uri":"dataartsstudio_01_0005.html", + "node_id":"dataartsstudio_01_0005.xml", "product_code":"dataartsstudio", "code":"38", - "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "des":"Before using DataArts Studio, you need to select cloud services or databases as the data foundation, which provides storage and compute capabilities. DataArts Studio prov", "doc_type":"usermanual", - "kw":"Managing Data Connections", + "kw":"Data Sources Supported by DataArts Studio,Management Center,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Data Connections", + "title":"Data Sources Supported by DataArts Studio", "githuburl":"" }, { @@ -816,453 +819,558 @@ "code":"39", "des":"You can create data connections by configuring data sources. Based on the data connections of the Management Center, DataArts Studio performs data development, governance", "doc_type":"usermanual", - "kw":"Creating a Data Connection,Managing Data Connections,User Guide", + "kw":"Creating a DataArts Studio Data Connection,Management Center,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Creating a Data Connection", + "title":"Creating a DataArts Studio Data Connection", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0009.html", + "node_id":"dataartsstudio_01_0009.xml", + "product_code":"dataartsstudio", + "code":"40", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Configuring DataArts Studio Data Connection Parameters", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Configuring DataArts Studio Data Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1300.html", "node_id":"dataartsstudio_01_1300.xml", "product_code":"dataartsstudio", - "code":"40", + "code":"41", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Configuring a DWS Connection,Managing Data Connections,User Guide", + "kw":"DWS Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring a DWS Connection", + "title":"DWS Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1301.html", "node_id":"dataartsstudio_01_1301.xml", "product_code":"dataartsstudio", - "code":"41", + "code":"42", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Configuring a DLI Connection,Managing Data Connections,User Guide", + "kw":"DLI Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring a DLI Connection", + "title":"DLI Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1306.html", "node_id":"dataartsstudio_01_1306.xml", "product_code":"dataartsstudio", - "code":"42", + "code":"43", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS Hive Connection,Managing Data Connections,User Guide", + "kw":"MRS Hive Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS Hive Connection", + "title":"MRS Hive Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1307.html", "node_id":"dataartsstudio_01_1307.xml", "product_code":"dataartsstudio", - "code":"43", + "code":"44", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS HBase Connection,Managing Data Connections,User Guide", + "kw":"MRS HBase Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS HBase Connection", + "title":"MRS HBase Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1308.html", "node_id":"dataartsstudio_01_1308.xml", "product_code":"dataartsstudio", - "code":"44", + "code":"45", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS Kafka Connection,Managing Data Connections,User Guide", + "kw":"MRS Kafka Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS Kafka Connection", + "title":"MRS Kafka Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1314.html", "node_id":"dataartsstudio_01_1314.xml", "product_code":"dataartsstudio", - "code":"45", + "code":"46", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS Spark Connection,Managing Data Connections,User Guide", + "kw":"MRS Spark Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS Spark Connection", + "title":"MRS Spark Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1309.html", "node_id":"dataartsstudio_01_1309.xml", "product_code":"dataartsstudio", - "code":"46", + "code":"47", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS ClickHouse Connection,Managing Data Connections,User Guide", + "kw":"MRS ClickHouse Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Gui", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS ClickHouse Connection", + "title":"MRS ClickHouse Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1310.html", "node_id":"dataartsstudio_01_1310.xml", "product_code":"dataartsstudio", - "code":"47", + "code":"48", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS Hetu Connection,Managing Data Connections,User Guide", + "kw":"MRS Hetu Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS Hetu Connection", + "title":"MRS Hetu Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1311.html", "node_id":"dataartsstudio_01_1311.xml", "product_code":"dataartsstudio", - "code":"48", + "code":"49", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS Impala Connection,Managing Data Connections,User Guide", + "kw":"MRS Impala Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS Impala Connection", + "title":"MRS Impala Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1390.html", "node_id":"dataartsstudio_01_1390.xml", "product_code":"dataartsstudio", - "code":"49", + "code":"50", "des":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "doc_type":"usermanual", - "kw":"Configuring an MRS Doris Connection,Managing Data Connections,User Guide", + "kw":"Doris Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an MRS Doris Connection", + "title":"Doris Connection Parameters", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_1321.html", + "node_id":"dataartsstudio_01_1321.xml", + "product_code":"dataartsstudio", + "code":"51", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"OpenSource ClickHouse Connection Parameters,Configuring DataArts Studio Data Connection Parameters,U", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"OpenSource ClickHouse Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1303.html", "node_id":"dataartsstudio_01_1303.xml", "product_code":"dataartsstudio", - "code":"50", - "des":"You can create connections to RDS databases including MySQL, PostgreSQL, SQL Server, SAP HANA, and DM databases.", + "code":"52", + "des":"RDS connections can be used to connect to MySQL, PostgreSQL, and SQL Server databases.", "doc_type":"usermanual", - "kw":"Configuring an RDS Connection,Managing Data Connections,User Guide", + "kw":"RDS Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an RDS Connection", + "title":"RDS Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1302.html", "node_id":"dataartsstudio_01_1302.xml", "product_code":"dataartsstudio", - "code":"51", + "code":"53", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Configuring an Oracle Connection,Managing Data Connections,User Guide", + "kw":"Oracle Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring an Oracle Connection", + "title":"Oracle Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1305.html", "node_id":"dataartsstudio_01_1305.xml", "product_code":"dataartsstudio", - "code":"52", + "code":"54", "des":"The maximum number of shell or Python scripts that can run concurrently on the ECS is determined by the value of MaxSessions in the /etc/ssh/sshd_config file on the ECS. ", "doc_type":"usermanual", - "kw":"Configuring a Host Connection,Managing Data Connections,User Guide", + "kw":"Host Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring a Host Connection", + "title":"Host Connection Parameters", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_1620.html", + "node_id":"dataartsstudio_01_1620.xml", + "product_code":"dataartsstudio", + "code":"55", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Rest Client Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Rest Client Connection Parameters", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_1509.html", + "node_id":"dataartsstudio_01_1509.xml", + "product_code":"dataartsstudio", + "code":"56", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"Redis Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Redis Connection Parameters", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_1510.html", + "node_id":"dataartsstudio_01_1510.xml", + "product_code":"dataartsstudio", + "code":"57", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "doc_type":"usermanual", + "kw":"SAP HANA Connection Parameters,Configuring DataArts Studio Data Connection Parameters,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"SAP HANA Connection Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0010.html", "node_id":"dataartsstudio_01_0010.xml", "product_code":"dataartsstudio", - "code":"53", - "des":"To migrate resources in one workspace to another, you can use the resource migration function provided by DataArts Studio.Resources that can be migrated include the data ", + "code":"58", + "des":"To migrate resources in one workspace to another, you can use the resource migration function provided by DataArts Studio.Resources can be imported from OBS or a local pa", "doc_type":"usermanual", - "kw":"Migrating Resources,Management Center,User Guide", + "kw":"Configuring DataArts Studio Resource Migration,Management Center,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Migrating Resources", + "title":"Configuring DataArts Studio Resource Migration", "githuburl":"" }, { "uri":"dataartsstudio_01_5105.html", "node_id":"dataartsstudio_01_5105.xml", "product_code":"dataartsstudio", - "code":"54", + "code":"59", "des":"You can configure isolation between the development and production environments for DLI and DB.After the environment isolation is configured, the data connection in the d", "doc_type":"usermanual", - "kw":"Configuring Environment Isolation for a Workspace in Enterprise Mode,Management Center,User Guide", + "kw":"Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode,Management Cent", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring Environment Isolation for a Workspace in Enterprise Mode", + "title":"Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode", "githuburl":"" }, { "uri":"dataartsstudio_01_0350.html", "node_id":"dataartsstudio_01_0350.xml", "product_code":"dataartsstudio", - "code":"55", + "code":"60", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Tutorials", + "kw":"Typical Scenarios for Using Management Center", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Tutorials", + "title":"Typical Scenarios for Using Management Center", "githuburl":"" }, { "uri":"dataartsstudio_01_0351.html", "node_id":"dataartsstudio_01_0351.xml", "product_code":"dataartsstudio", - "code":"56", + "code":"61", "des":"This section describes how to create an MRS Hive connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a databas", "doc_type":"usermanual", - "kw":"Creating an MRS Hive Connection,Tutorials,User Guide", + "kw":"Creating a Connection Between DataArts Studio and an MRS Hive Data Lake,Typical Scenarios for Using ", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Creating an MRS Hive Connection", + "title":"Creating a Connection Between DataArts Studio and an MRS Hive Data Lake", "githuburl":"" }, { "uri":"dataartsstudio_01_0352.html", "node_id":"dataartsstudio_01_0352.xml", "product_code":"dataartsstudio", - "code":"57", + "code":"62", "des":"This section describes how to create a DWS connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a database or c", "doc_type":"usermanual", - "kw":"Creating a DWS Connection,Tutorials,User Guide", + "kw":"Creating a Connection Between DataArts Studio and a GaussDB(DWS) Data Lake,Typical Scenarios for Usi", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Creating a DWS Connection", + "title":"Creating a Connection Between DataArts Studio and a GaussDB(DWS) Data Lake", "githuburl":"" }, { "uri":"dataartsstudio_01_0353.html", "node_id":"dataartsstudio_01_0353.xml", "product_code":"dataartsstudio", - "code":"58", + "code":"63", "des":"This section describes how to create a MySQL connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a database or", "doc_type":"usermanual", - "kw":"Creating a MySQL Connection,Tutorials,User Guide", + "kw":"Creating a Connection Between DataArts Studio and a MySQL Database,Typical Scenarios for Using Manag", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Creating a MySQL Connection", + "title":"Creating a Connection Between DataArts Studio and a MySQL Database", "githuburl":"" }, { "uri":"dataartsstudio_01_0012.html", "node_id":"dataartsstudio_01_0012.xml", "product_code":"dataartsstudio", - "code":"59", + "code":"64", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"DataArts Migration", + "kw":"DataArts Migration (CDM Jobs)", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"DataArts Migration", + "title":"DataArts Migration (CDM Jobs)", "githuburl":"" }, { "uri":"dataartsstudio_01_0013.html", "node_id":"dataartsstudio_01_0013.xml", "product_code":"dataartsstudio", - "code":"60", + "code":"65", "des":"DataArts Migration is an efficient and easy-to-use data integration service. Based on the big data migration to the cloud and intelligent data lake solutions, CDM provide", "doc_type":"usermanual", - "kw":"Overview,DataArts Migration,User Guide", + "kw":"Overview,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1275,28 +1383,28 @@ "uri":"dataartsstudio_01_0015.html", "node_id":"dataartsstudio_01_0015.xml", "product_code":"dataartsstudio", - "code":"61", - "des":"You cannot modify the flavor of an existing cluster. If you require a higher flavor, create a cluster with your desired flavor.Arm CDM clusters do not support agents. The", + "code":"66", + "des":"You cannot modify the flavor of an existing cluster. If you require a higher flavor, create a cluster with your desired flavor.The CDM cluster version (Arm or x86) is det", "doc_type":"usermanual", - "kw":"Constraints,DataArts Migration,User Guide", + "kw":"Notes and Constraints,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Constraints", + "title":"Notes and Constraints", "githuburl":"" }, { "uri":"dataartsstudio_01_0215.html", "node_id":"dataartsstudio_01_0215.xml", "product_code":"dataartsstudio", - "code":"62", + "code":"67", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Supported Data Sources", @@ -1304,7 +1412,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1317,7 +1425,7 @@ "uri":"dataartsstudio_01_0196.html", "node_id":"dataartsstudio_01_0196.xml", "product_code":"dataartsstudio", - "code":"63", + "code":"68", "des":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", "doc_type":"usermanual", "kw":"Supported Data Sources (2.10.0.300),Supported Data Sources,User Guide", @@ -1325,7 +1433,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1334,32 +1442,11 @@ "title":"Supported Data Sources (2.10.0.300)", "githuburl":"" }, - { - "uri":"dataartsstudio_01_0197.html", - "node_id":"dataartsstudio_01_0197.xml", - "product_code":"dataartsstudio", - "code":"64", - "des":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", - "doc_type":"usermanual", - "kw":"Supported Data Sources (2.10.0.100),Supported Data Sources,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Supported Data Sources (2.10.0.100)", - "githuburl":"" - }, { "uri":"dataartsstudio_01_0014.html", "node_id":"dataartsstudio_01_0014.xml", "product_code":"dataartsstudio", - "code":"65", + "code":"69", "des":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", "doc_type":"usermanual", "kw":"Supported Data Sources (2.9.3.300),Supported Data Sources,User Guide", @@ -1367,7 +1454,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1380,7 +1467,7 @@ "uri":"dataartsstudio_01_0816.html", "node_id":"dataartsstudio_01_0816.xml", "product_code":"dataartsstudio", - "code":"66", + "code":"70", "des":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", "doc_type":"usermanual", "kw":"Supported Data Sources (2.9.2.200),Supported Data Sources,User Guide", @@ -1388,7 +1475,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1401,7 +1488,7 @@ "uri":"dataartsstudio_01_0224.html", "node_id":"dataartsstudio_01_0224.xml", "product_code":"dataartsstudio", - "code":"67", + "code":"71", "des":"To ensure that data is completely imported to the migration destination, correctly configure field mappings based on data types supported for different data sources. For ", "doc_type":"usermanual", "kw":"Supported Data Types,Supported Data Sources,User Guide", @@ -1409,7 +1496,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1422,36 +1509,36 @@ "uri":"dataartsstudio_01_0017.html", "node_id":"dataartsstudio_01_0017.xml", "product_code":"dataartsstudio", - "code":"68", + "code":"72", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Managing Clusters", + "kw":"Creating and Managing a CDM Cluster", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Clusters", + "title":"Creating and Managing a CDM Cluster", "githuburl":"" }, { "uri":"dataartsstudio_01_0576.html", "node_id":"dataartsstudio_01_0576.xml", "product_code":"dataartsstudio", - "code":"69", + "code":"73", "des":"CDM provides independent clusters for secure and reliable data migration. Clusters are isolated from each other and cannot access each other.CDM clusters can be used in t", "doc_type":"usermanual", - "kw":"Creating a CDM Cluster,Managing Clusters,User Guide", + "kw":"Creating a CDM Cluster,Creating and Managing a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1461,18 +1548,18 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0020_0.html", - "node_id":"dataartsstudio_01_0020_0.xml", + "uri":"dataartsstudio_01_0586.html", + "node_id":"dataartsstudio_01_0586.xml", "product_code":"dataartsstudio", - "code":"70", + "code":"74", "des":"After creating a CDM cluster, you can bind an EIP to or unbind an EIP from the cluster.If CDM needs to access a local or Internet data source, or a cloud service in anoth", "doc_type":"usermanual", - "kw":"Binding or Unbinding an EIP,Managing Clusters,User Guide", + "kw":"Binding or Unbinding an EIP,Creating and Managing a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1485,120 +1572,120 @@ "uri":"dataartsstudio_01_0578.html", "node_id":"dataartsstudio_01_0578.xml", "product_code":"dataartsstudio", - "code":"71", - "des":"After modifying some configurations (for example, disabling user isolation), you must restart the cluster to make the modification take effect.You have created a CDM clus", + "code":"75", + "des":"After modifying some configurations (for example, disabling user isolation), you must restart the cluster to make the modification take effect.If you restart a CDM cluste", "doc_type":"usermanual", - "kw":"Restarting a Cluster,Managing Clusters,User Guide", + "kw":"Restarting a CDM Cluster,Creating and Managing a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Restarting a Cluster", + "title":"Restarting a CDM Cluster", "githuburl":"" }, { "uri":"dataartsstudio_01_0579.html", "node_id":"dataartsstudio_01_0579.xml", "product_code":"dataartsstudio", - "code":"72", + "code":"76", "des":"You can delete a CDM cluster that you no longer use.After a CDM cluster is deleted, the cluster and its data are destroyed and cannot be restored. Exercise caution when p", "doc_type":"usermanual", - "kw":"Deleting a Cluster,Managing Clusters,User Guide", + "kw":"Deleting a CDM Cluster,Creating and Managing a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Deleting a Cluster", + "title":"Deleting a CDM Cluster", "githuburl":"" }, { "uri":"dataartsstudio_01_0022.html", "node_id":"dataartsstudio_01_0022.xml", "product_code":"dataartsstudio", - "code":"73", + "code":"77", "des":"This section describes how to obtain cluster logs to view the job running history and locate job failure causes.You have created a CDM cluster.", "doc_type":"usermanual", - "kw":"Downloading Cluster Logs,Managing Clusters,User Guide", + "kw":"Downloading CDM Cluster Logs,Creating and Managing a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Downloading Cluster Logs", + "title":"Downloading CDM Cluster Logs", "githuburl":"" }, { - "uri":"dataartsstudio_01_0021_0.html", - "node_id":"dataartsstudio_01_0021_0.xml", + "uri":"dataartsstudio_01_0587.html", + "node_id":"dataartsstudio_01_0587.xml", "product_code":"dataartsstudio", - "code":"74", - "des":"After creating a CDM cluster, you can view its basic information and modify its configurations.You can view the following basic cluster information:Cluster information: c", + "code":"78", + "des":"After creating a CDM cluster, you can view its basic information and modify its configurations.You can view the following basic cluster information:Cluster Information: c", "doc_type":"usermanual", - "kw":"Viewing Basic Cluster Information and Modifying Cluster Configurations,Managing Clusters,User Guide", + "kw":"Viewing and Modifying CDM Cluster Configurations,Creating and Managing a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Viewing Basic Cluster Information and Modifying Cluster Configurations", + "title":"Viewing and Modifying CDM Cluster Configurations", "githuburl":"" }, { "uri":"dataartsstudio_01_0121.html", "node_id":"dataartsstudio_01_0121.xml", "product_code":"dataartsstudio", - "code":"75", + "code":"79", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Viewing Metrics", + "kw":"Managing and Viewing CDM Metrics", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Viewing Metrics", + "title":"Managing and Viewing CDM Metrics", "githuburl":"" }, { "uri":"dataartsstudio_01_0122.html", "node_id":"dataartsstudio_01_0122.xml", "product_code":"dataartsstudio", - "code":"76", + "code":"80", "des":"Cloud Eye monitors the running status of cloud services and usage of each metric, and creates alarm rules for monitoring metrics.After you create a CDM cluster, Cloud Eye", "doc_type":"usermanual", - "kw":"CDM Metrics,Viewing Metrics,User Guide", + "kw":"CDM Metrics,Managing and Viewing CDM Metrics,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -1611,729 +1698,750 @@ "uri":"dataartsstudio_01_0123.html", "node_id":"dataartsstudio_01_0123.xml", "product_code":"dataartsstudio", - "code":"77", + "code":"81", "des":"Set the alarm rules to customize the monitored objects and notification policies. Then, learn CDM running status in a timely manner.A CDM alarm rule includes the alarm ru", "doc_type":"usermanual", - "kw":"Configuring Alarm Rules,Viewing Metrics,User Guide", + "kw":"Configuring CDM Alarm Rules,Managing and Viewing CDM Metrics,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring Alarm Rules", + "title":"Configuring CDM Alarm Rules", "githuburl":"" }, { "uri":"dataartsstudio_01_0124.html", "node_id":"dataartsstudio_01_0124.xml", "product_code":"dataartsstudio", - "code":"78", + "code":"82", "des":"You can use Cloud Eye to monitor the running status of a CDM cluster. You can view the monitoring metrics on the Cloud Eye console.Monitored data takes some time for tran", "doc_type":"usermanual", - "kw":"Querying Metrics,Viewing Metrics,User Guide", + "kw":"Querying CDM Metrics,Managing and Viewing CDM Metrics,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Querying Metrics", + "title":"Querying CDM Metrics", "githuburl":"" }, { "uri":"dataartsstudio_01_0023.html", "node_id":"dataartsstudio_01_0023.xml", "product_code":"dataartsstudio", - "code":"79", + "code":"83", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Managing Links", + "kw":"Creating a Link in a CDM Cluster", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Links", + "title":"Creating a Link in a CDM Cluster", "githuburl":"" }, { "uri":"dataartsstudio_01_0024.html", "node_id":"dataartsstudio_01_0024.xml", "product_code":"dataartsstudio", - "code":"80", + "code":"84", "des":"Before creating a data migration job, create a link to enable the CDM cluster to read data from and write data to a data source. A migration job requires a source link an", "doc_type":"usermanual", - "kw":"Creating Links,Managing Links,User Guide", + "kw":"Creating a Link Between CDM and a Data Source,Creating a Link in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Creating Links", + "title":"Creating a Link Between CDM and a Data Source", "githuburl":"" }, { - "uri":"dataartsstudio_01_0132.html", - "node_id":"dataartsstudio_01_0132.xml", + "uri":"dataartsstudio_01_0157.html", + "node_id":"dataartsstudio_01_0157.xml", "product_code":"dataartsstudio", - "code":"81", - "des":"The Java Database Connectivity (JDBC) provides programmatic access to relational databases. Applications can execute SQL statements and retrieve data using the JDBC API.B", + "code":"85", + "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Managing Drivers,Managing Links,User Guide", + "kw":"Configuring Link Parameters", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Drivers", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0128.html", - "node_id":"dataartsstudio_01_0128.xml", - "product_code":"dataartsstudio", - "code":"82", - "des":"If your data is stored in HDFS or a relational database, you can deploy an agent on the source network. CDM pulls data from your internal data sources through an agent bu", - "doc_type":"usermanual", - "kw":"Managing Agents,Managing Links,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Managing Agents", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_1096.html", - "node_id":"dataartsstudio_01_1096.xml", - "product_code":"dataartsstudio", - "code":"83", - "des":"On the Cluster Configurations page, you can create, edit, or delete Hadoop cluster configurations.When creating a Hadoop link, the Hadoop cluster configurations can simpl", - "doc_type":"usermanual", - "kw":"Managing Cluster Configurations,Managing Links,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Managing Cluster Configurations", + "title":"Configuring Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0045.html", "node_id":"dataartsstudio_01_0045.xml", "product_code":"dataartsstudio", - "code":"84", + "code":"86", "des":"When connecting CDM to the destination OBS bucket, you need to add the read and write permissions to the destination OBS bucket, and file authentication is not required.I", "doc_type":"usermanual", - "kw":"Link to OBS,Managing Links,User Guide", + "kw":"OBS Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to OBS", + "title":"OBS Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0044.html", "node_id":"dataartsstudio_01_0044.xml", "product_code":"dataartsstudio", - "code":"85", - "des":"Table 1 lists the parameters for creating a link to PostgreSQL/SQLServer.Do not change the password or user when the job is running. If you do so, the password will not t", + "code":"87", + "des":"Table 1 lists the parameters for creating a link to PostgreSQL/SQLServer. Greenplum, Kingbase, and GaussDB can be connected through the PostgreSQL connector. The source a", "doc_type":"usermanual", - "kw":"Link to PostgreSQL/SQLServer,Managing Links,User Guide", + "kw":"PostgreSQL/SQLServer Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to PostgreSQL/SQLServer", + "title":"PostgreSQL/SQLServer Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0226.html", "node_id":"dataartsstudio_01_0226.xml", "product_code":"dataartsstudio", - "code":"86", + "code":"88", "des":"Table 1 describes the DWS link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the ", "doc_type":"usermanual", - "kw":"Link to DWS,Managing Links,User Guide", + "kw":"GaussDB(DWS) Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to DWS", + "title":"GaussDB(DWS) Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1211.html", "node_id":"dataartsstudio_01_1211.xml", "product_code":"dataartsstudio", - "code":"87", + "code":"89", "des":"Table 1 lists the parameters for a link to a MySQL database.Do not change the password or user when the job is running. If you do so, the password will not take effect im", "doc_type":"usermanual", - "kw":"Link to an RDS for MySQL/MySQL Database,Managing Links,User Guide", + "kw":"RDS for MySQL/MySQL Database Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to an RDS for MySQL/MySQL Database", + "title":"RDS for MySQL/MySQL Database Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1212.html", "node_id":"dataartsstudio_01_1212.xml", "product_code":"dataartsstudio", - "code":"88", + "code":"90", "des":"Table 1 lists the parameters for a link to an Oracle database.Do not change the password or user when the job is running. If you do so, the password will not take effect ", "doc_type":"usermanual", - "kw":"Link to an Oracle Database,Managing Links,User Guide", + "kw":"Oracle Database Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to an Oracle Database", + "title":"Oracle Database Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0036.html", "node_id":"dataartsstudio_01_0036.xml", "product_code":"dataartsstudio", - "code":"89", + "code":"91", "des":"When connecting CDM to DLI, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password will n", "doc_type":"usermanual", - "kw":"Link to DLI,Managing Links,User Guide", + "kw":"DLI Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to DLI", + "title":"DLI Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0026.html", "node_id":"dataartsstudio_01_0026.xml", "product_code":"dataartsstudio", - "code":"90", + "code":"92", "des":"CDM supports the following Hive data sources:MRS HiveFusionInsight HiveApache HiveDo not change the password or user when the job is running. If you do so, the password w", "doc_type":"usermanual", - "kw":"Link to Hive,Managing Links,User Guide", + "kw":"Hive Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to Hive", + "title":"Hive Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0039.html", "node_id":"dataartsstudio_01_0039.xml", "product_code":"dataartsstudio", - "code":"91", + "code":"93", "des":"CDM supports the following HBase data sources:MRS HBaseFusionInsight HBaseApache HBaseDo not change the password or user when the job is running. If you do so, the passwo", "doc_type":"usermanual", - "kw":"Link to HBase,Managing Links,User Guide", + "kw":"HBase Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to HBase", + "title":"HBase Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0040.html", "node_id":"dataartsstudio_01_0040.xml", "product_code":"dataartsstudio", - "code":"92", + "code":"94", "des":"CDM supports the following HDFS data sources:MRS HDFSFusionInsight HDFSApache HDFSDo not change the password or user when the job is running. If you do so, the password w", "doc_type":"usermanual", - "kw":"Link to HDFS,Managing Links,User Guide", + "kw":"HDFS Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to HDFS", + "title":"HDFS Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0028.html", "node_id":"dataartsstudio_01_0028.xml", "product_code":"dataartsstudio", - "code":"93", + "code":"95", "des":"The FTP/SFTP link is used to migrate files from the on-premises file server or ECS to a database.Only FTP servers running Linux are supported.Do not change the password o", "doc_type":"usermanual", - "kw":"Link to an FTP or SFTP Server,Managing Links,User Guide", + "kw":"FTP/SFTP Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to an FTP or SFTP Server", + "title":"FTP/SFTP Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0032.html", "node_id":"dataartsstudio_01_0032.xml", "product_code":"dataartsstudio", - "code":"94", + "code":"96", "des":"The Redis link is applicable to data migration of Redis created in the local data center or ECS. It is used to load data in the database or files to Redis.Links to Redis ", "doc_type":"usermanual", - "kw":"Link to Redis,Managing Links,User Guide", + "kw":"Redis Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to Redis", + "title":"Redis Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0031.html", "node_id":"dataartsstudio_01_0031.xml", "product_code":"dataartsstudio", - "code":"95", + "code":"97", "des":"The DDS link is used to synchronize data from Document Database Service (DDS) on the cloud to a big data platform.When connecting CDM to DDS, configure the parameters as ", "doc_type":"usermanual", - "kw":"Link to DDS,Managing Links,User Guide", + "kw":"DDS Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to DDS", + "title":"DDS Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0027.html", "node_id":"dataartsstudio_01_0027.xml", "product_code":"dataartsstudio", - "code":"96", + "code":"98", "des":"When connecting CDM to CloudTable, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password", "doc_type":"usermanual", - "kw":"Link to CloudTable,Managing Links,User Guide", + "kw":"CloudTable Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to CloudTable", + "title":"CloudTable Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0030.html", "node_id":"dataartsstudio_01_0030.xml", "product_code":"dataartsstudio", - "code":"97", + "code":"99", "des":"This link is used to transfer data from a third-party cloud MongoDB service or MongoDB created in the on-premises data center or ECS to a big data platform.When connectin", "doc_type":"usermanual", - "kw":"Link to MongoDB,Managing Links,User Guide", + "kw":"MongoDB Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to MongoDB", + "title":"MongoDB Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_004501.html", "node_id":"dataartsstudio_01_004501.xml", "product_code":"dataartsstudio", - "code":"98", - "des":"Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.", + "code":"100", + "des":"Cassandra is not supported in version 2.9.3.300 or later.Do not change the password or user when a job is running. If you do so, the password will not take effect immedia", "doc_type":"usermanual", - "kw":"Link to Cassandra,Managing Links,User Guide", + "kw":"Cassandra Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to Cassandra", + "title":"Cassandra Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0033.html", "node_id":"dataartsstudio_01_0033.xml", "product_code":"dataartsstudio", - "code":"99", + "code":"101", "des":"When connecting CDM to Kafka of MRS, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the passwo", "doc_type":"usermanual", - "kw":"Link to Kafka,Managing Links,User Guide", + "kw":"Kafka Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to Kafka", + "title":"Kafka Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0038.html", "node_id":"dataartsstudio_01_0038.xml", "product_code":"dataartsstudio", - "code":"100", + "code":"102", "des":"When connecting CDM to DMS Kafka, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password ", "doc_type":"usermanual", - "kw":"Link to DMS Kafka,Managing Links,User Guide", + "kw":"DMS Kafka Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to DMS Kafka", + "title":"DMS Kafka Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0035.html", "node_id":"dataartsstudio_01_0035.xml", "product_code":"dataartsstudio", - "code":"101", + "code":"103", "des":"Cloud Search Service (CSS) is a fully hosted distributed search service powered by open-source Elasticsearch. CSS links can be used to migrate log files and database reco", "doc_type":"usermanual", - "kw":"Link to CSS,Managing Links,User Guide", + "kw":"CSS Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to CSS", + "title":"CSS Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1380.html", "node_id":"dataartsstudio_01_1380.xml", "product_code":"dataartsstudio", - "code":"102", + "code":"104", "des":"Elasticsearch links can be used to connect to Elasticsearch services in third-party clouds and local data centers and on Elastic Cloud Servers (ECSs).The Elasticsearch co", "doc_type":"usermanual", - "kw":"Link to Elasticsearch,Managing Links,User Guide", + "kw":"Elasticsearch Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to Elasticsearch", + "title":"Elasticsearch Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0227.html", "node_id":"dataartsstudio_01_0227.xml", "product_code":"dataartsstudio", - "code":"103", + "code":"105", "des":"Table 1 describes the SAP HANA link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and", "doc_type":"usermanual", - "kw":"Link to SAP HANA,Managing Links,User Guide", + "kw":"SAP HANA Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to SAP HANA", + "title":"SAP HANA Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_1214.html", "node_id":"dataartsstudio_01_1214.xml", "product_code":"dataartsstudio", - "code":"104", + "code":"106", "des":"Sharding refers to the link to multiple backend data sources at the same time. The link can be used as the job source to migrate data from multiple data sources to other ", "doc_type":"usermanual", - "kw":"Link to a Database Shard,Managing Links,User Guide", + "kw":"Shard Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to a Database Shard", + "title":"Shard Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0184.html", "node_id":"dataartsstudio_01_0184.xml", "product_code":"dataartsstudio", - "code":"105", + "code":"107", "des":"Table 1 describes the MRS Hudi link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and", "doc_type":"usermanual", - "kw":"Link to MRS Hudi,Managing Links,User Guide", + "kw":"MRS Hudi Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to MRS Hudi", + "title":"MRS Hudi Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0285.html", "node_id":"dataartsstudio_01_0285.xml", "product_code":"dataartsstudio", - "code":"106", + "code":"108", "des":"Table 1 describes the MRS ClickHouse link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediate", "doc_type":"usermanual", - "kw":"Link to MRS ClickHouse,Managing Links,User Guide", + "kw":"MRS ClickHouse Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to MRS ClickHouse", + "title":"MRS ClickHouse Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0290.html", "node_id":"dataartsstudio_01_0290.xml", "product_code":"dataartsstudio", - "code":"107", + "code":"109", "des":"Table 1 lists the parameters for a link to a ShenTong database.Do not change the password or user when the job is running. If you do so, the password will not take effect", "doc_type":"usermanual", - "kw":"Link to a ShenTong Database,Managing Links,User Guide", + "kw":"ShenTong Database Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to a ShenTong Database", + "title":"ShenTong Database Link Parameters", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0288.html", + "node_id":"dataartsstudio_01_0288.xml", + "product_code":"dataartsstudio", + "code":"110", + "des":"Table 1 describes the LogHub (SLS) link parameters.", + "doc_type":"usermanual", + "kw":"LogHub (SLS) Link Parameters,Configuring Link Parameters,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"LogHub (SLS) Link Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0037.html", "node_id":"dataartsstudio_01_0037.xml", "product_code":"dataartsstudio", - "code":"108", + "code":"111", "des":"When connecting CDM to CloudTable OpenTSDB, configure the parameters as described in Table 1.", "doc_type":"usermanual", - "kw":"Link to CloudTable OpenTSDB,Managing Links,User Guide", + "kw":"CloudTable OpenTSDB Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to CloudTable OpenTSDB", + "title":"CloudTable OpenTSDB Link Parameters", "githuburl":"" }, { - "uri":"dataartsstudio_01_1215.html", - "node_id":"dataartsstudio_01_1215.xml", + "uri":"dataartsstudio_01_1628.html", + "node_id":"dataartsstudio_01_1628.xml", "product_code":"dataartsstudio", - "code":"109", - "des":"CDM can connect to open-source Doris and MRS Doris. Table 1 lists the parameters for a Doris link.Do not change the password or user when the job is running. If you do so", + "code":"112", + "des":"Table 1 describes the YASHAN link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and t", "doc_type":"usermanual", - "kw":"Link to Doris,Managing Links,User Guide", + "kw":"YASHAN Link Parameters,Configuring Link Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Link to Doris", + "title":"YASHAN Link Parameters", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0132.html", + "node_id":"dataartsstudio_01_0132.xml", + "product_code":"dataartsstudio", + "code":"113", + "des":"The Java Database Connectivity (JDBC) provides programmatic access to relational databases. Applications can execute SQL statements and retrieve data using the JDBC API.B", + "doc_type":"usermanual", + "kw":"Uploading a CDM Link Driver,Creating a Link in a CDM Cluster,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Uploading a CDM Link Driver", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_1096.html", + "node_id":"dataartsstudio_01_1096.xml", + "product_code":"dataartsstudio", + "code":"114", + "des":"On the Cluster Configurations page, you can create, edit, or delete Hadoop cluster configurations.When creating a Hadoop link, the Hadoop cluster configurations can simpl", + "doc_type":"usermanual", + "kw":"Creating a Hadoop Cluster Configuration,Creating a Link in a CDM Cluster,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Creating a Hadoop Cluster Configuration", "githuburl":"" }, { "uri":"dataartsstudio_01_0081.html", "node_id":"dataartsstudio_01_0081.xml", "product_code":"dataartsstudio", - "code":"110", + "code":"115", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Managing Jobs", + "kw":"Creating a Job in a CDM Cluster", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Jobs", + "title":"Creating a Job in a CDM Cluster", "githuburl":"" }, { "uri":"dataartsstudio_01_0046.html", "node_id":"dataartsstudio_01_0046.xml", "product_code":"dataartsstudio", - "code":"111", + "code":"116", "des":"CDM supports table and file migration between homogeneous or heterogeneous data sources. For details about supported data sources, see Supported Data Sources.The dirty da", "doc_type":"usermanual", - "kw":"Table/File Migration Jobs,Managing Jobs,User Guide", + "kw":"Table/File Migration Jobs,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2346,15 +2454,15 @@ "uri":"dataartsstudio_01_0075.html", "node_id":"dataartsstudio_01_0075.xml", "product_code":"dataartsstudio", - "code":"112", + "code":"117", "des":"CDM supports entire DB migration between homogeneous and heterogeneous data sources. The migration principles are the same as those in Table/File Migration Jobs. Each typ", "doc_type":"usermanual", - "kw":"Creating an Entire Database Migration Job,Managing Jobs,User Guide", + "kw":"Creating an Entire Database Migration Job,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2367,36 +2475,36 @@ "uri":"dataartsstudio_01_0047.html", "node_id":"dataartsstudio_01_0047.xml", "product_code":"dataartsstudio", - "code":"113", + "code":"118", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Source Job Parameters", + "kw":"Configuring CDM Source Job Parameters", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Source Job Parameters", + "title":"Configuring CDM Source Job Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0048.html", "node_id":"dataartsstudio_01_0048.xml", "product_code":"dataartsstudio", - "code":"114", + "code":"119", "des":"If the source link of a job is an OBS link, configure the source job parameters based on Table 1.Advanced attributes are optional and not displayed by default. You can cl", "doc_type":"usermanual", - "kw":"From OBS,Source Job Parameters,User Guide", + "kw":"From OBS,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2409,15 +2517,15 @@ "uri":"dataartsstudio_01_0049.html", "node_id":"dataartsstudio_01_0049.xml", "product_code":"dataartsstudio", - "code":"115", + "code":"120", "des":"If the source link of a job is an HDFS link, that is, if data is exported from MRS HDFS, FusionInsight HDFS, or Apache HDFS, configure the source job parameters based on ", "doc_type":"usermanual", - "kw":"From HDFS,Source Job Parameters,User Guide", + "kw":"From HDFS,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2430,15 +2538,15 @@ "uri":"dataartsstudio_01_0050.html", "node_id":"dataartsstudio_01_0050.xml", "product_code":"dataartsstudio", - "code":"116", + "code":"121", "des":"If the source link of a job is an HBase or CloudTable link, that is, if data is exported from MRS HBase, FusionInsight HBase, CloudTable, or Apache HBase, configure the s", "doc_type":"usermanual", - "kw":"From HBase/CloudTable,Source Job Parameters,User Guide", + "kw":"From HBase/CloudTable,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2451,15 +2559,15 @@ "uri":"dataartsstudio_01_0051.html", "node_id":"dataartsstudio_01_0051.xml", "product_code":"dataartsstudio", - "code":"117", + "code":"122", "des":"If the source link of a job is a Hive link, configure the source job parameters based on Table 1.If the data source is Hive, CDM will automatically partition data using t", "doc_type":"usermanual", - "kw":"From Hive,Source Job Parameters,User Guide", + "kw":"From Hive,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2469,18 +2577,18 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0120_0.html", - "node_id":"dataartsstudio_01_0120_0.xml", + "uri":"dataartsstudio_01_0120.html", + "node_id":"dataartsstudio_01_0120.xml", "product_code":"dataartsstudio", - "code":"118", + "code":"123", "des":"If the source link of a job is a DLI link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From DLI,Source Job Parameters,User Guide", + "kw":"From DLI,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2493,15 +2601,15 @@ "uri":"dataartsstudio_01_0052.html", "node_id":"dataartsstudio_01_0052.xml", "product_code":"dataartsstudio", - "code":"119", + "code":"124", "des":"If the source link of a job is an FTP or SFTP link, configure the source job parameters based on Table 1.Advanced attributes are optional and not displayed by default. Yo", "doc_type":"usermanual", - "kw":"From FTP/SFTP,Source Job Parameters,User Guide", + "kw":"From FTP/SFTP,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2514,15 +2622,15 @@ "uri":"dataartsstudio_01_0053.html", "node_id":"dataartsstudio_01_0053.xml", "product_code":"dataartsstudio", - "code":"120", + "code":"125", "des":"If the source link of a job is an HTTP link, configure the source job parameters based on Table 1. Currently, data can only be exported from the HTTP URLs.", "doc_type":"usermanual", - "kw":"From HTTP,Source Job Parameters,User Guide", + "kw":"From HTTP,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2535,15 +2643,15 @@ "uri":"dataartsstudio_01_0054.html", "node_id":"dataartsstudio_01_0054.xml", "product_code":"dataartsstudio", - "code":"121", + "code":"126", "des":"If the source link of a job is an RDS for PostgreSQL, RDS for SQL Server, PostgreSQL, or Microsoft SQL Server link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From PostgreSQL/SQL Server,Source Job Parameters,User Guide", + "kw":"From PostgreSQL/SQL Server,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2556,15 +2664,15 @@ "uri":"dataartsstudio_01_0387.html", "node_id":"dataartsstudio_01_0387.xml", "product_code":"dataartsstudio", - "code":"122", + "code":"127", "des":"If the source link of a job is a DWS link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From DWS,Source Job Parameters,User Guide", + "kw":"From DWS,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2577,15 +2685,15 @@ "uri":"dataartsstudio_01_0388.html", "node_id":"dataartsstudio_01_0388.xml", "product_code":"dataartsstudio", - "code":"123", + "code":"128", "des":"Table 1 lists the job parameters when the source link is a SAP HANA link.", "doc_type":"usermanual", - "kw":"From SAP HANA,Source Job Parameters,User Guide", + "kw":"From SAP HANA,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2598,15 +2706,15 @@ "uri":"dataartsstudio_01_1254.html", "node_id":"dataartsstudio_01_1254.xml", "product_code":"dataartsstudio", - "code":"124", + "code":"129", "des":"If the source link of a job is an RDS for MySQL or MySQL link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From MySQL,Source Job Parameters,User Guide", + "kw":"From MySQL,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2619,15 +2727,15 @@ "uri":"dataartsstudio_01_1255.html", "node_id":"dataartsstudio_01_1255.xml", "product_code":"dataartsstudio", - "code":"125", + "code":"130", "des":"If the source link of a job is an Oracle link, configure the source job parameters based on Table 1.When an Oracle database is the migration source, if Partitioning Field", "doc_type":"usermanual", - "kw":"From Oracle,Source Job Parameters,User Guide", + "kw":"From Oracle,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2640,15 +2748,15 @@ "uri":"dataartsstudio_01_1256.html", "node_id":"dataartsstudio_01_1256.xml", "product_code":"dataartsstudio", - "code":"126", + "code":"131", "des":"If the source link of a job is a database shard link, configure the source job parameters based on Table 1.If the Source Link Name is the backend link of the sharded link", "doc_type":"usermanual", - "kw":"From a Database Shard,Source Job Parameters,User Guide", + "kw":"From a Database Shard,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2661,15 +2769,15 @@ "uri":"dataartsstudio_01_0055.html", "node_id":"dataartsstudio_01_0055.xml", "product_code":"dataartsstudio", - "code":"127", + "code":"132", "des":"When you migrate MongoDB or DDS data, CDM reads the first row of the collection as an example of the field list. If the first row of data does not contain all fields of t", "doc_type":"usermanual", - "kw":"From MongoDB/DDS,Source Job Parameters,User Guide", + "kw":"From MongoDB/DDS,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2682,15 +2790,15 @@ "uri":"dataartsstudio_01_0056.html", "node_id":"dataartsstudio_01_0056.xml", "product_code":"dataartsstudio", - "code":"128", + "code":"133", "des":"The Redis service of the third-party cloud cannot serve as the migration source. However, the Redis set up in the on-premises data center or on the ECS can be the migrati", "doc_type":"usermanual", - "kw":"From Redis,Source Job Parameters,User Guide", + "kw":"From Redis,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2703,15 +2811,15 @@ "uri":"dataartsstudio_01_0058.html", "node_id":"dataartsstudio_01_0058.xml", "product_code":"dataartsstudio", - "code":"129", + "code":"134", "des":"If the source link of a job is a Kafka link or DMS Kafka link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From Kafka/DMS Kafka,Source Job Parameters,User Guide", + "kw":"From Kafka/DMS Kafka,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2724,15 +2832,15 @@ "uri":"dataartsstudio_01_0059.html", "node_id":"dataartsstudio_01_0059.xml", "product_code":"dataartsstudio", - "code":"130", - "des":"If the source link of a job is a link described in Link to Elasticsearch or Link to CSS, configure the source job parameters based on Table 1.", + "code":"135", + "des":"If the source link of a job is a link described in Elasticsearch Link Parameters or CSS Link Parameters, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From Elasticsearch or CSS,Source Job Parameters,User Guide", + "kw":"From Elasticsearch or CSS,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2745,15 +2853,15 @@ "uri":"dataartsstudio_01_0060.html", "node_id":"dataartsstudio_01_0060.xml", "product_code":"dataartsstudio", - "code":"131", + "code":"136", "des":"If the source link of a job is a CloudTable OpenTSDB link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From OpenTSDB,Source Job Parameters,User Guide", + "kw":"From OpenTSDB,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2766,15 +2874,15 @@ "uri":"dataartsstudio_01_0185.html", "node_id":"dataartsstudio_01_0185.xml", "product_code":"dataartsstudio", - "code":"132", + "code":"137", "des":"If the source link of a job is an MRS Hudi link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From MRS Hudi,Source Job Parameters,User Guide", + "kw":"From MRS Hudi,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2787,15 +2895,15 @@ "uri":"dataartsstudio_01_0286.html", "node_id":"dataartsstudio_01_0286.xml", "product_code":"dataartsstudio", - "code":"133", + "code":"138", "des":"If the source link of a job is an MRS ClickHouse link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From MRS ClickHouse,Source Job Parameters,User Guide", + "kw":"From MRS ClickHouse,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2805,18 +2913,39 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0291.html", - "node_id":"dataartsstudio_01_0291.xml", + "uri":"dataartsstudio_01_0289.html", + "node_id":"dataartsstudio_01_0289.xml", "product_code":"dataartsstudio", - "code":"134", - "des":"If the source link of a job is a ShenTong database link, configure the source job parameters based on Table 1.", + "code":"139", + "des":"If the source link of a job is a LogHub (SLS) link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From a ShenTong Database,Source Job Parameters,User Guide", + "kw":"From LogHub (SLS),Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"From LogHub (SLS)", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0291.html", + "node_id":"dataartsstudio_01_0291.xml", + "product_code":"dataartsstudio", + "code":"140", + "des":"If the source link of a job is a ShenTong database link, configure the source job parameters based on Table 1.", + "doc_type":"usermanual", + "kw":"From a ShenTong Database,Configuring CDM Source Job Parameters,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2826,60 +2955,60 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0136.html", - "node_id":"dataartsstudio_01_0136.xml", + "uri":"dataartsstudio_01_1629.html", + "node_id":"dataartsstudio_01_1629.xml", "product_code":"dataartsstudio", - "code":"135", - "des":"If the source link of a job is a Doris link, configure the source job parameters based on Table 1.", + "code":"141", + "des":"If the source link of a job is a YASHAN link, configure the source job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"From Doris,Source Job Parameters,User Guide", + "kw":"From YASHAN,Configuring CDM Source Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"From Doris", + "title":"From YASHAN", "githuburl":"" }, { "uri":"dataartsstudio_01_0061.html", "node_id":"dataartsstudio_01_0061.xml", "product_code":"dataartsstudio", - "code":"136", + "code":"142", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Destination Job Parameters", + "kw":"Configuring CDM Destination Job Parameters", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Destination Job Parameters", + "title":"Configuring CDM Destination Job Parameters", "githuburl":"" }, { "uri":"dataartsstudio_01_0062.html", "node_id":"dataartsstudio_01_0062.xml", "product_code":"dataartsstudio", - "code":"137", + "code":"143", "des":"If the destination link of a job is an OBS link, that is, data is to be imported to OBS, configure the destination job parameters based on Table 1.Advanced attributes are", "doc_type":"usermanual", - "kw":"To OBS,Destination Job Parameters,User Guide", + "kw":"To OBS,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2892,15 +3021,15 @@ "uri":"dataartsstudio_01_0063.html", "node_id":"dataartsstudio_01_0063.xml", "product_code":"dataartsstudio", - "code":"138", + "code":"144", "des":"If the destination link of a job is an HDFS link, configure the destination job parameters based on Table 1.HDFS supports the UTF-8 encoding only. Retain the default valu", "doc_type":"usermanual", - "kw":"To HDFS,Destination Job Parameters,User Guide", + "kw":"To HDFS,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2913,15 +3042,15 @@ "uri":"dataartsstudio_01_0064.html", "node_id":"dataartsstudio_01_0064.xml", "product_code":"dataartsstudio", - "code":"139", + "code":"145", "des":"If the destination link of a job is an HBase link or CloudTable link, configure the destination job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"To HBase/CloudTable,Destination Job Parameters,User Guide", + "kw":"To HBase/CloudTable,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2934,15 +3063,15 @@ "uri":"dataartsstudio_01_0066.html", "node_id":"dataartsstudio_01_0066.xml", "product_code":"dataartsstudio", - "code":"140", - "des":"If the destination link of a job is a Hive link, configure the destination job parameters based on Table 1.When Hive serves as the destination end, a table whose storage ", + "code":"146", + "des":"If the destination link of a job is a Hive link, configure the destination job parameters based on Table 1.If the source Hive contains both the array and map types of dat", "doc_type":"usermanual", - "kw":"To Hive,Destination Job Parameters,User Guide", + "kw":"To Hive,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2955,15 +3084,15 @@ "uri":"dataartsstudio_01_0068.html", "node_id":"dataartsstudio_01_0068.xml", "product_code":"dataartsstudio", - "code":"141", + "code":"147", "des":"Table 1 lists the destination job parameters when the destination link is an MySQL, SQL Server, or PostgreSQL link.", "doc_type":"usermanual", - "kw":"To MySQL/SQL Server/PostgreSQL,Destination Job Parameters,User Guide", + "kw":"To MySQL/SQL Server/PostgreSQL,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2976,15 +3105,15 @@ "uri":"dataartsstudio_01_0252.html", "node_id":"dataartsstudio_01_0252.xml", "product_code":"dataartsstudio", - "code":"142", + "code":"148", "des":"If the destination link of a job is an Oracle database link, configure the destination job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"To Oracle,Destination Job Parameters,User Guide", + "kw":"To Oracle,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -2997,15 +3126,15 @@ "uri":"dataartsstudio_01_1251.html", "node_id":"dataartsstudio_01_1251.xml", "product_code":"dataartsstudio", - "code":"143", + "code":"149", "des":"If the destination link of a job is a DWS link, configure the destination job parameters based on Table 1.Figure 1 describes the field mapping between DWS tables created ", "doc_type":"usermanual", - "kw":"To DWS,Destination Job Parameters,User Guide", + "kw":"To DWS,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3018,15 +3147,15 @@ "uri":"dataartsstudio_01_0069.html", "node_id":"dataartsstudio_01_0069.xml", "product_code":"dataartsstudio", - "code":"144", + "code":"150", "des":"If the destination link of a job is a DDS link, configure the destination job parameters based on Table 1.Parameter descriptionParameterDescriptionExample ValueDatabase N", "doc_type":"usermanual", - "kw":"To DDS,Destination Job Parameters,User Guide", + "kw":"To DDS,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3039,15 +3168,15 @@ "uri":"dataartsstudio_01_0070.html", "node_id":"dataartsstudio_01_0070.xml", "product_code":"dataartsstudio", - "code":"145", + "code":"151", "des":"Table 1 lists the destination job parameters when the destination link is a Redis link.Parameter descriptionParameterDescriptionExample ValueRedis Key PrefixKey prefix, w", "doc_type":"usermanual", - "kw":"To Redis,Destination Job Parameters,User Guide", + "kw":"To Redis,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3060,15 +3189,15 @@ "uri":"dataartsstudio_01_0071.html", "node_id":"dataartsstudio_01_0071.xml", "product_code":"dataartsstudio", - "code":"146", - "des":"If the destination link of a job is a link described in Link to Elasticsearch or Link to CSS, configure the destination job parameters based on Table 1.", + "code":"152", + "des":"If the destination link of a job is a link described in Elasticsearch Link Parameters or CSS Link Parameters, configure the destination job parameters based on Table 1.Th", "doc_type":"usermanual", - "kw":"To Elasticsearch/CSS,Destination Job Parameters,User Guide", + "kw":"To Elasticsearch/CSS,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3081,15 +3210,15 @@ "uri":"dataartsstudio_01_0072.html", "node_id":"dataartsstudio_01_0072.xml", "product_code":"dataartsstudio", - "code":"147", - "des":"If the destination link of a job is a DLI link, configure the destination job parameters based on Table 1.When you use CDM to migrate data to DLI, DLI generates data file", + "code":"153", + "des":"If the destination link of a job is a DLI link, configure the destination job parameters based on Table 1.When data is migrated to DLI using CDM, DLI generates data files", "doc_type":"usermanual", - "kw":"To DLI,Destination Job Parameters,User Guide", + "kw":"To DLI,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3102,15 +3231,15 @@ "uri":"dataartsstudio_01_0074.html", "node_id":"dataartsstudio_01_0074.xml", "product_code":"dataartsstudio", - "code":"148", + "code":"154", "des":"If the destination link of a job is a CloudTable OpenTSDB link, configure the destination job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"To OpenTSDB,Destination Job Parameters,User Guide", + "kw":"To OpenTSDB,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3123,15 +3252,15 @@ "uri":"dataartsstudio_01_0186.html", "node_id":"dataartsstudio_01_0186.xml", "product_code":"dataartsstudio", - "code":"149", + "code":"155", "des":"If the destination link of a job is an MRS Hudi link, configure the destination job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"To MRS Hudi,Destination Job Parameters,User Guide", + "kw":"To MRS Hudi,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3144,15 +3273,15 @@ "uri":"dataartsstudio_01_0287.html", "node_id":"dataartsstudio_01_0287.xml", "product_code":"dataartsstudio", - "code":"150", + "code":"156", "des":"If the destination link of a job is an MRS ClickHouse link, configure the destination job parameters based on Table 1.If the source link of the job is an MRS ClickHouse, ", "doc_type":"usermanual", - "kw":"To MRS ClickHouse,Destination Job Parameters,User Guide", + "kw":"To MRS ClickHouse,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3165,15 +3294,15 @@ "uri":"dataartsstudio_01_0332.html", "node_id":"dataartsstudio_01_0332.xml", "product_code":"dataartsstudio", - "code":"151", + "code":"157", "des":"If the destination link of a job is a MongoDB link, configure the destination job parameters based on Table 1.", "doc_type":"usermanual", - "kw":"To MongoDB,Destination Job Parameters,User Guide", + "kw":"To MongoDB,Configuring CDM Destination Job Parameters,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3182,137 +3311,137 @@ "title":"To MongoDB", "githuburl":"" }, - { - "uri":"dataartsstudio_01_0999.html", - "node_id":"dataartsstudio_01_0999.xml", - "product_code":"dataartsstudio", - "code":"152", - "des":"Table 1 lists the destination job parameters when the destination link is a Doris link.", - "doc_type":"usermanual", - "kw":"To Doris,Destination Job Parameters,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"To Doris", - "githuburl":"" - }, { "uri":"dataartsstudio_01_0261.html", "node_id":"dataartsstudio_01_0261.xml", "product_code":"dataartsstudio", - "code":"153", + "code":"158", "des":"After the job parameters are configured, you can configure field mapping. You can click on the Map Field page to customize new fields or click in the Operation column t", "doc_type":"usermanual", - "kw":"Configuring Field Mapping,Managing Jobs,User Guide", + "kw":"Configuring CDM Job Field Mapping,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Configuring Field Mapping", + "title":"Configuring CDM Job Field Mapping", "githuburl":"" }, { "uri":"dataartsstudio_01_0082.html", "node_id":"dataartsstudio_01_0082.xml", "product_code":"dataartsstudio", - "code":"154", + "code":"159", "des":"CDM supports scheduled execution of table/file migration jobs by minute, hour, day, week, and month. This section describes how to configure scheduled job parameters.When", "doc_type":"usermanual", - "kw":"Scheduling Job Execution,Managing Jobs,User Guide", + "kw":"Configuring a Scheduled CDM Job,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Scheduling Job Execution", + "title":"Configuring a Scheduled CDM Job", "githuburl":"" }, { "uri":"dataartsstudio_01_0083.html", "node_id":"dataartsstudio_01_0083.xml", "product_code":"dataartsstudio", - "code":"155", + "code":"160", "des":"On the Settings tab page, you can perform the following operations:Maximum Concurrent ExtractorsScheduled Backup/RestorationEnvironment Variables of Job ParametersMaximum", "doc_type":"usermanual", - "kw":"Job Configuration Management,Managing Jobs,User Guide", + "kw":"Managing CDM Job Configuration,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Job Configuration Management", + "title":"Managing CDM Job Configuration", "githuburl":"" }, { "uri":"dataartsstudio_01_0084.html", "node_id":"dataartsstudio_01_0084.xml", "product_code":"dataartsstudio", - "code":"156", + "code":"161", "des":"Existing CDM jobs can be viewed, modified, deleted, started, and stopped. This section describes how to view and modify a job.Viewing job statusThe job status can be New,", "doc_type":"usermanual", - "kw":"Managing a Single Job,Managing Jobs,User Guide", + "kw":"Managing a CDM Job,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing a Single Job", + "title":"Managing a CDM Job", "githuburl":"" }, { "uri":"dataartsstudio_01_0085.html", "node_id":"dataartsstudio_01_0085.xml", "product_code":"dataartsstudio", - "code":"157", - "des":"This section describes how to manage CDM table/file migration jobs in batches. The following operations are involved:Manage jobs by group.Run jobs in batches.Delete jobs ", + "code":"162", + "des":"This section describes how to manage CDM table/file migration jobs in batches. The following operations are supported:Managing jobs by groupRunning jobs in batchesDeletin", "doc_type":"usermanual", - "kw":"Managing Jobs in Batches,Managing Jobs,User Guide", + "kw":"Managing CDM Jobs,Creating a Job in a CDM Cluster,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Jobs in Batches", + "title":"Managing CDM Jobs", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_0114.html", + "node_id":"dataartsstudio_01_0114.xml", + "product_code":"dataartsstudio", + "code":"163", + "des":"During the creation of table/file migration jobs, CDM supports the macro variables of date and time in the following parameters of the source and destination links:Source", + "doc_type":"usermanual", + "kw":"Using Macro Variables of Date and Time,DataArts Migration (CDM Jobs),User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Using Macro Variables of Date and Time", "githuburl":"" }, { "uri":"dataartsstudio_01_0018.html", "node_id":"dataartsstudio_01_0018.xml", "product_code":"dataartsstudio", - "code":"158", + "code":"164", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Improving Migration Performance", @@ -3320,7 +3449,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3333,7 +3462,7 @@ "uri":"dataartsstudio_01_0025.html", "node_id":"dataartsstudio_01_0025.xml", "product_code":"dataartsstudio", - "code":"159", + "code":"165", "des":"Figure 1 shows the simplified migration model used by CDM.CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submit", "doc_type":"usermanual", "kw":"How Migration Jobs Work,Improving Migration Performance,User Guide", @@ -3341,7 +3470,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3354,7 +3483,7 @@ "uri":"dataartsstudio_01_0076.html", "node_id":"dataartsstudio_01_0076.xml", "product_code":"dataartsstudio", - "code":"160", + "code":"166", "des":"In addition to increasing the source read speed, improving the destination write performance, and increasing the bandwidth, you can accelerate migration using the followi", "doc_type":"usermanual", "kw":"Performance Tuning,Improving Migration Performance,User Guide", @@ -3362,7 +3491,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3375,7 +3504,7 @@ "uri":"dataartsstudio_01_0078.html", "node_id":"dataartsstudio_01_0078.xml", "product_code":"dataartsstudio", - "code":"161", + "code":"167", "des":"CDM splits jobs for different data sources based on different dimensions. Table 1 lists the splitting dimensions.", "doc_type":"usermanual", "kw":"Reference: Job Splitting Dimensions,Improving Migration Performance,User Guide", @@ -3383,7 +3512,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3396,7 +3525,7 @@ "uri":"dataartsstudio_01_0077.html", "node_id":"dataartsstudio_01_0077.xml", "product_code":"dataartsstudio", - "code":"162", + "code":"168", "des":"The performance metrics provided in this document are for reference only. The performance at your site may be affected by factors such as the data source performance at t", "doc_type":"usermanual", "kw":"Reference: CDM Performance Test Data,Improving Migration Performance,User Guide", @@ -3404,7 +3533,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3417,7 +3546,7 @@ "uri":"dataartsstudio_01_0110.html", "node_id":"dataartsstudio_01_0110.xml", "product_code":"dataartsstudio", - "code":"163", + "code":"169", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Key Operation Guide", @@ -3425,7 +3554,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3438,7 +3567,7 @@ "uri":"dataartsstudio_01_0111.html", "node_id":"dataartsstudio_01_0111.xml", "product_code":"dataartsstudio", - "code":"164", + "code":"170", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Incremental Migration", @@ -3446,7 +3575,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3459,7 +3588,7 @@ "uri":"dataartsstudio_01_0112.html", "node_id":"dataartsstudio_01_0112.xml", "product_code":"dataartsstudio", - "code":"165", + "code":"171", "des":"CDM supports incremental migration of file systems. After full migration is complete, all new files or only specified directories or files can be exported.Currently, CDM ", "doc_type":"usermanual", "kw":"Incremental File Migration,Incremental Migration,User Guide", @@ -3467,7 +3596,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3480,7 +3609,7 @@ "uri":"dataartsstudio_01_0113.html", "node_id":"dataartsstudio_01_0113.xml", "product_code":"dataartsstudio", - "code":"166", + "code":"172", "des":"CDM supports incremental migration of relational databases. After a full migration is complete, data in a specified period can be incrementally migrated. For example, dat", "doc_type":"usermanual", "kw":"Incremental Migration of Relational Databases,Incremental Migration,User Guide", @@ -3488,7 +3617,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3498,10 +3627,10 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0115_0.html", - "node_id":"dataartsstudio_01_0115_0.xml", + "uri":"dataartsstudio_01_0137.html", + "node_id":"dataartsstudio_01_0137.xml", "product_code":"dataartsstudio", - "code":"167", + "code":"173", "des":"You can use CDM to export data in a specified period of time from HBase (including MRS HBase, FusionInsight HBase, and Apache HBase) and CloudTable. The CDM scheduled job", "doc_type":"usermanual", "kw":"HBase/CloudTable Incremental Migration,Incremental Migration,User Guide", @@ -3509,7 +3638,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3522,7 +3651,7 @@ "uri":"dataartsstudio_01_0125.html", "node_id":"dataartsstudio_01_0125.xml", "product_code":"dataartsstudio", - "code":"168", + "code":"174", "des":"By using CDM, you can export MongoDB or DDS data within a specified period. With the scheduled jobs of CDM, you can implement incremental migration of MongoDB and DDS.If ", "doc_type":"usermanual", "kw":"MongoDB/DDS Incremental Migration,Incremental Migration,User Guide", @@ -3530,7 +3659,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3540,31 +3669,10 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0114.html", - "node_id":"dataartsstudio_01_0114.xml", + "uri":"dataartsstudio_01_0589.html", + "node_id":"dataartsstudio_01_0589.xml", "product_code":"dataartsstudio", - "code":"169", - "des":"During the creation of table/file migration jobs, CDM supports the macro variables of date and time in the following parameters of the source and destination links:Source", - "doc_type":"usermanual", - "kw":"Using Macro Variables of Date and Time,Key Operation Guide,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Using Macro Variables of Date and Time", - "githuburl":"" - }, - { - "uri":"dataartsstudio_01_0116_0.html", - "node_id":"dataartsstudio_01_0116_0.xml", - "product_code":"dataartsstudio", - "code":"170", + "code":"175", "des":"When a CDM job fails to be executed, CDM rolls back the data to the state before the job starts and automatically deletes data from the destination table.Parameter positi", "doc_type":"usermanual", "kw":"Migration in Transaction Mode,Key Operation Guide,User Guide", @@ -3572,7 +3680,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3582,10 +3690,10 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0117_0.html", - "node_id":"dataartsstudio_01_0117_0.xml", + "uri":"dataartsstudio_01_0590.html", + "node_id":"dataartsstudio_01_0590.xml", "product_code":"dataartsstudio", - "code":"171", + "code":"176", "des":"When you migrate files to a file system, CDM can encrypt and decrypt those files. Currently, CDM supports the following encryption modes:AES-256-GCMKMS EncryptionAES-256-", "doc_type":"usermanual", "kw":"Encryption and Decryption During File Migration,Key Operation Guide,User Guide", @@ -3593,7 +3701,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3603,10 +3711,10 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0118_0.html", - "node_id":"dataartsstudio_01_0118_0.xml", + "uri":"dataartsstudio_01_0591.html", + "node_id":"dataartsstudio_01_0591.xml", "product_code":"dataartsstudio", - "code":"172", + "code":"177", "des":"CDM extracts data from the migration source and writes the data to the migration destination. Figure 1 shows the migration mode when files are migrated to OBS.During the ", "doc_type":"usermanual", "kw":"MD5 Verification,Key Operation Guide,User Guide", @@ -3614,7 +3722,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3627,7 +3735,7 @@ "uri":"dataartsstudio_01_0104.html", "node_id":"dataartsstudio_01_0104.xml", "product_code":"dataartsstudio", - "code":"173", + "code":"178", "des":"After the job parameters are configured, field mapping needs to be configured. You can click in the Operation column to create a field converter.If files are migrated be", "doc_type":"usermanual", "kw":"Configuring Field Converters,Key Operation Guide,User Guide", @@ -3635,7 +3743,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3648,7 +3756,7 @@ "uri":"dataartsstudio_01_0304.html", "node_id":"dataartsstudio_01_0304.xml", "product_code":"dataartsstudio", - "code":"174", + "code":"179", "des":"After job parameters are configured, field mapping needs to be configured. You can customize new fields by clicking on the Map Field page.If files are migrated between F", "doc_type":"usermanual", "kw":"Adding Fields,Key Operation Guide,User Guide", @@ -3656,7 +3764,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3666,10 +3774,10 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0105.html", - "node_id":"dataartsstudio_01_0105.xml", + "uri":"dataartsstudio_01_0592.html", + "node_id":"dataartsstudio_01_0592.xml", "product_code":"dataartsstudio", - "code":"175", + "code":"180", "des":"You can migrate files (a maximum of 50) with specified names from FTP, OBS, or SFTP at a time. The exported files can only be written to the same directory on the migrati", "doc_type":"usermanual", "kw":"Migrating Files with Specified Names,Key Operation Guide,User Guide", @@ -3677,7 +3785,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3687,10 +3795,10 @@ "githuburl":"" }, { - "uri":"dataartsstudio_01_0106.html", - "node_id":"dataartsstudio_01_0106.xml", + "uri":"dataartsstudio_01_0593.html", + "node_id":"dataartsstudio_01_0593.xml", "product_code":"dataartsstudio", - "code":"176", + "code":"181", "des":"During table/file migration, CDM uses delimiters to separate fields in CSV files. However, delimiters cannot be used in complex semi-structured data because the field val", "doc_type":"usermanual", "kw":"Regular Expressions for Separating Semi-structured Text,Key Operation Guide,User Guide", @@ -3698,7 +3806,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3711,7 +3819,7 @@ "uri":"dataartsstudio_01_0109.html", "node_id":"dataartsstudio_01_0109.xml", "product_code":"dataartsstudio", - "code":"177", + "code":"182", "des":"When you create a job on the CDM console to migrate tables or files of a relational database, you can add a field to record the time when they were written to the databas", "doc_type":"usermanual", "kw":"Recording the Time When Data Is Written to the Database,Key Operation Guide,User Guide", @@ -3719,7 +3827,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3732,7 +3840,7 @@ "uri":"dataartsstudio_01_0108.html", "node_id":"dataartsstudio_01_0108.xml", "product_code":"dataartsstudio", - "code":"178", + "code":"183", "des":"When creating a CDM job, you need to specify File Format in the job parameters of the migration source and destination in some scenarios. This section describes the appli", "doc_type":"usermanual", "kw":"File Formats,Key Operation Guide,User Guide", @@ -3740,7 +3848,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3753,7 +3861,7 @@ "uri":"dataartsstudio_01_0209.html", "node_id":"dataartsstudio_01_0209.xml", "product_code":"dataartsstudio", - "code":"179", + "code":"184", "des":"When field mapping is configured on CDM, a message is displayed indicating that the data type of the field is not supported and the field needs to be deleted. If you need", "doc_type":"usermanual", "kw":"Converting Unsupported Data Types,Key Operation Guide,User Guide", @@ -3761,7 +3869,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3774,15 +3882,15 @@ "uri":"dataartsstudio_01_2000.html", "node_id":"dataartsstudio_01_2000.xml", "product_code":"dataartsstudio", - "code":"180", - "des":"Figure 1 describes the field mapping between the DWS tables created by CDM and source tables. For example, if you use CDM to migrate the Oracle database to DWS, CDM autom", + "code":"185", + "des":"CDM converts the field type of the source to the field type of the destination based on the default rule and creates a table at the destination.Figure 1 describes the fie", "doc_type":"usermanual", "kw":"Auto Table Creation,Key Operation Guide,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3795,7 +3903,7 @@ "uri":"dataartsstudio_01_0086.html", "node_id":"dataartsstudio_01_0086.xml", "product_code":"dataartsstudio", - "code":"181", + "code":"186", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Tutorials", @@ -3803,7 +3911,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3816,7 +3924,7 @@ "uri":"dataartsstudio_01_0130.html", "node_id":"dataartsstudio_01_0130.xml", "product_code":"dataartsstudio", - "code":"182", + "code":"187", "des":"MRS Hive links are applicable to the MapReduce Service (MRS). This tutorial describes how to create an MRS Hive link.You have created a CDM cluster.You have obtained the ", "doc_type":"usermanual", "kw":"Creating an MRS Hive Link,Tutorials,User Guide", @@ -3824,7 +3932,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3837,7 +3945,7 @@ "uri":"dataartsstudio_01_0131.html", "node_id":"dataartsstudio_01_0131.xml", "product_code":"dataartsstudio", - "code":"183", + "code":"188", "des":"MySQL links are applicable to third-party cloud MySQL services and MySQL created in a local data center or ECS. This tutorial describes how to create a MySQL link.You hav", "doc_type":"usermanual", "kw":"Creating a MySQL Link,Tutorials,User Guide", @@ -3845,7 +3953,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3858,7 +3966,7 @@ "uri":"dataartsstudio_01_0092.html", "node_id":"dataartsstudio_01_0092.xml", "product_code":"dataartsstudio", - "code":"184", + "code":"189", "des":"MRS provides enterprise-level big data clusters on the cloud. It contains HDFS, Hive, and Spark components and is applicable to massive data analysis of enterprises.Hive ", "doc_type":"usermanual", "kw":"Migrating Data from MySQL to MRS Hive,Tutorials,User Guide", @@ -3866,7 +3974,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3879,7 +3987,7 @@ "uri":"dataartsstudio_01_0100.html", "node_id":"dataartsstudio_01_0100.xml", "product_code":"dataartsstudio", - "code":"185", + "code":"190", "des":"CDM supports table-to-OBS data migration. This section describes how to migrate tables from a MySQL database to OBS. The process is as follows:Creating a CDM Cluster and ", "doc_type":"usermanual", "kw":"Migrating Data from MySQL to OBS,Tutorials,User Guide", @@ -3887,7 +3995,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3900,7 +4008,7 @@ "uri":"dataartsstudio_01_0101.html", "node_id":"dataartsstudio_01_0101.xml", "product_code":"dataartsstudio", - "code":"186", + "code":"191", "des":"CDM supports table-to-table data migration. This section describes how to migrate data from MySQL to DWS. The process is as follows:Creating a CDM Cluster and Binding an ", "doc_type":"usermanual", "kw":"Migrating Data from MySQL to DWS,Tutorials,User Guide", @@ -3908,7 +4016,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3921,7 +4029,7 @@ "uri":"dataartsstudio_01_0098.html", "node_id":"dataartsstudio_01_0098.xml", "product_code":"dataartsstudio", - "code":"187", + "code":"192", "des":"This section describes how to migrate the entire on-premises MySQL database to RDS using the CDM's entire DB migration function.Currently, CDM can migrate the entire on-p", "doc_type":"usermanual", "kw":"Migrating an Entire MySQL Database to RDS,Tutorials,User Guide", @@ -3929,7 +4037,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3942,7 +4050,7 @@ "uri":"dataartsstudio_01_0091.html", "node_id":"dataartsstudio_01_0091.xml", "product_code":"dataartsstudio", - "code":"188", + "code":"193", "des":"Cloud Search Service provides users with structured and unstructured data search, statistics, and report capabilities. This section describes how to use CDM to migrate da", "doc_type":"usermanual", "kw":"Migrating Data from Oracle to CSS,Tutorials,User Guide", @@ -3950,7 +4058,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3963,7 +4071,7 @@ "uri":"dataartsstudio_01_0133.html", "node_id":"dataartsstudio_01_0133.xml", "product_code":"dataartsstudio", - "code":"189", + "code":"194", "des":"CDM supports table-to-table migration. This section describes how to use CDM to migrate data from Oracle to Data Warehouse Service (DWS). The procedure is as follows:Crea", "doc_type":"usermanual", "kw":"Migrating Data from Oracle to DWS,Tutorials,User Guide", @@ -3971,7 +4079,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -3984,7 +4092,7 @@ "uri":"dataartsstudio_01_0088.html", "node_id":"dataartsstudio_01_0088.xml", "product_code":"dataartsstudio", - "code":"190", + "code":"195", "des":"CDM supports data migration between cloud services. This section describes how to use CDM to migrate data from OBS to CSS. The procedure is as follows:Creating a CDM Clus", "doc_type":"usermanual", "kw":"Migrating Data from OBS to CSS,Tutorials,User Guide", @@ -3992,7 +4100,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4005,7 +4113,7 @@ "uri":"dataartsstudio_01_0089.html", "node_id":"dataartsstudio_01_0089.xml", "product_code":"dataartsstudio", - "code":"191", + "code":"196", "des":"DLI is a fully hosted big data query service. This section describes how to use CDM to migrate data from OBS to DLI. The procedure includes four steps:Creating a CDM Clus", "doc_type":"usermanual", "kw":"Migrating Data from OBS to DLI,Tutorials,User Guide", @@ -4013,7 +4121,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4026,7 +4134,7 @@ "uri":"dataartsstudio_01_0103.html", "node_id":"dataartsstudio_01_0103.xml", "product_code":"dataartsstudio", - "code":"192", + "code":"197", "des":"CDM supports file-to-file data migration. This section describes how to migrate data from MRS HDFS to OBS. The process is as follows:Creating a CDM Cluster and Binding an", "doc_type":"usermanual", "kw":"Migrating Data from MRS HDFS to OBS,Tutorials,User Guide", @@ -4034,7 +4142,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4047,7 +4155,7 @@ "uri":"dataartsstudio_01_0099.html", "node_id":"dataartsstudio_01_0099.xml", "product_code":"dataartsstudio", - "code":"193", + "code":"198", "des":"CSS provides users with structured and unstructured data search, statistics, and report capabilities. This section describes how to use CDM to migrate the entire Elastics", "doc_type":"usermanual", "kw":"Migrating the Entire Elasticsearch Database to CSS,Tutorials,User Guide", @@ -4055,7 +4163,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4068,7 +4176,7 @@ "uri":"dataartsstudio_01_0400.html", "node_id":"dataartsstudio_01_0400.xml", "product_code":"dataartsstudio", - "code":"194", + "code":"199", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"DataArts Factory", @@ -4076,7 +4184,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4089,7 +4197,7 @@ "uri":"dataartsstudio_01_0401.html", "node_id":"dataartsstudio_01_0401.xml", "product_code":"dataartsstudio", - "code":"195", + "code":"200", "des":"DataArts Factory is a one-stop big data collaborative development platform that provides fully managed big data scheduling capabilities. It manages various big data servi", "doc_type":"usermanual", "kw":"Overview,DataArts Factory,User Guide", @@ -4097,7 +4205,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4110,7 +4218,7 @@ "uri":"dataartsstudio_01_0403.html", "node_id":"dataartsstudio_01_0403.xml", "product_code":"dataartsstudio", - "code":"196", + "code":"201", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Data Management", @@ -4118,7 +4226,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4131,7 +4239,7 @@ "uri":"dataartsstudio_01_0402.html", "node_id":"dataartsstudio_01_0402.xml", "product_code":"dataartsstudio", - "code":"197", + "code":"202", "des":"The data management function helps you quickly establish data models and provides you with data entities for script and job development. With data management, you can:Man", "doc_type":"usermanual", "kw":"Data Management Process,Data Management,User Guide", @@ -4139,7 +4247,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4152,15 +4260,15 @@ "uri":"dataartsstudio_01_0404.html", "node_id":"dataartsstudio_01_0404.xml", "product_code":"dataartsstudio", - "code":"198", - "des":"After a data connection is created, you can perform data operations on DataArts Factory, for example, managing databases, namespaces, database schema, and tables.With one", + "code":"203", + "des":"After creating a data connection, you can perform data operations on DataArts Factory, for example, managing databases, namespaces, database schema, and tables.With one d", "doc_type":"usermanual", "kw":"Creating a Data Connection,Data Management,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4173,7 +4281,7 @@ "uri":"dataartsstudio_01_0405.html", "node_id":"dataartsstudio_01_0405.xml", "product_code":"dataartsstudio", - "code":"199", + "code":"204", "des":"After creating a data connection, you can create a database on the console or using a SQL script.(Recommended) Console: You can directly create a database on the DataArts", "doc_type":"usermanual", "kw":"Creating a Database,Data Management,User Guide", @@ -4181,7 +4289,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4194,15 +4302,15 @@ "uri":"dataartsstudio_01_0412.html", "node_id":"dataartsstudio_01_0412.xml", "product_code":"dataartsstudio", - "code":"200", - "des":"After creating a DWS data connection, you can manage the database schemas under the DWS data connection.A DWS data connection has been created. For details, see Creating ", + "code":"205", + "des":"After creating a DWS data connection, you can manage the database schemas under the DWS data connection.If existing database schemas meet your requirements, skip this sec", "doc_type":"usermanual", "kw":"(Optional) Creating a Database Schema,Data Management,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4215,7 +4323,7 @@ "uri":"dataartsstudio_01_0416.html", "node_id":"dataartsstudio_01_0416.xml", "product_code":"dataartsstudio", - "code":"201", + "code":"206", "des":"You can create a table on the DataArts Factory console, in DDL mode, or using a SQL script.(Recommended) Console: You can directly create a table on the DataArts Studio D", "doc_type":"usermanual", "kw":"Creating a Table,Data Management,User Guide", @@ -4223,7 +4331,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4236,7 +4344,7 @@ "uri":"dataartsstudio_01_0421.html", "node_id":"dataartsstudio_01_0421.xml", "product_code":"dataartsstudio", - "code":"202", + "code":"207", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Script Development", @@ -4244,7 +4352,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4257,7 +4365,7 @@ "uri":"dataartsstudio_01_0422.html", "node_id":"dataartsstudio_01_0422.xml", "product_code":"dataartsstudio", - "code":"203", + "code":"208", "des":"The script development function provides the following capabilities:Provides an online script editor for developing and debugging SQL, Python, and Shell scripts.Supports ", "doc_type":"usermanual", "kw":"Script Development Process,Script Development,User Guide", @@ -4265,7 +4373,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4278,7 +4386,7 @@ "uri":"dataartsstudio_01_0423.html", "node_id":"dataartsstudio_01_0423.xml", "product_code":"dataartsstudio", - "code":"204", + "code":"209", "des":"DataArts Factory allows you to create, edit, debug, and run SQL, Python, and Shell scripts. Before developing a script, you must create one.You have completed operations ", "doc_type":"usermanual", "kw":"Creating a Script,Script Development,User Guide", @@ -4286,7 +4394,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4299,7 +4407,7 @@ "uri":"dataartsstudio_01_0406.html", "node_id":"dataartsstudio_01_0406.xml", "product_code":"dataartsstudio", - "code":"205", + "code":"210", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Developing Scripts", @@ -4307,7 +4415,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4320,7 +4428,7 @@ "uri":"dataartsstudio_01_0424.html", "node_id":"dataartsstudio_01_0424.xml", "product_code":"dataartsstudio", - "code":"206", + "code":"211", "des":"DataArts Factory allows you to develop, debug, and run SQL scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.DataArts Fact", "doc_type":"usermanual", "kw":"Developing an SQL Script,Developing Scripts,User Guide", @@ -4328,7 +4436,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4341,7 +4449,7 @@ "uri":"dataartsstudio_01_0425.html", "node_id":"dataartsstudio_01_0425.xml", "product_code":"dataartsstudio", - "code":"207", + "code":"212", "des":"DataArts Factory allows you to develop, debug, and run Shell scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.A shell scr", "doc_type":"usermanual", "kw":"Developing a Shell Script,Developing Scripts,User Guide", @@ -4349,7 +4457,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4362,7 +4470,7 @@ "uri":"dataartsstudio_01_4503.html", "node_id":"dataartsstudio_01_4503.xml", "product_code":"dataartsstudio", - "code":"208", + "code":"213", "des":"DataArts Factory allows you to develop, debug, and run Python scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.For detail", "doc_type":"usermanual", "kw":"Developing a Python Script,Developing Scripts,User Guide", @@ -4370,7 +4478,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4383,7 +4491,7 @@ "uri":"dataartsstudio_01_0901.html", "node_id":"dataartsstudio_01_0901.xml", "product_code":"dataartsstudio", - "code":"209", + "code":"214", "des":"Submitting a version depends on the version management function of DataArts Factory.Version management traces script and job changes, and supports version comparison and ", "doc_type":"usermanual", "kw":"Submitting a Version,Script Development,User Guide", @@ -4391,7 +4499,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4404,7 +4512,7 @@ "uri":"dataartsstudio_01_1902.html", "node_id":"dataartsstudio_01_1902.xml", "product_code":"dataartsstudio", - "code":"210", + "code":"215", "des":"In enterprise mode, when a developer submits a script version, the system generates a script release task. After the developer confirms releasing a package and the admin,", "doc_type":"usermanual", "kw":"Releasing a Script Task,Script Development,User Guide", @@ -4412,7 +4520,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4425,7 +4533,7 @@ "uri":"dataartsstudio_01_0407.html", "node_id":"dataartsstudio_01_0407.xml", "product_code":"dataartsstudio", - "code":"211", + "code":"216", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"(Optional) Managing Scripts", @@ -4433,7 +4541,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4446,7 +4554,7 @@ "uri":"dataartsstudio_01_0430.html", "node_id":"dataartsstudio_01_0430.xml", "product_code":"dataartsstudio", - "code":"212", + "code":"217", "des":"This section describes how to copy a script.A script has been developed based on Developing Scripts.Log in to the DataArts Studio console by following the instructions in", "doc_type":"usermanual", "kw":"Copying a Script,(Optional) Managing Scripts,User Guide", @@ -4454,7 +4562,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4467,7 +4575,7 @@ "uri":"dataartsstudio_01_0426.html", "node_id":"dataartsstudio_01_0426.xml", "product_code":"dataartsstudio", - "code":"213", + "code":"218", "des":"You can copy the name of a script and rename a script.A script has been developed based on Developing Scripts.Log in to the DataArts Studio console by following the instr", "doc_type":"usermanual", "kw":"Copying the Script Name and Renaming a Script,(Optional) Managing Scripts,User Guide", @@ -4475,7 +4583,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4488,7 +4596,7 @@ "uri":"dataartsstudio_01_0427.html", "node_id":"dataartsstudio_01_0427.xml", "product_code":"dataartsstudio", - "code":"214", + "code":"219", "des":"You can move a script file from one directory to another or move a script directory to another directory.A script has been developed based on Developing Scripts.Log in to", "doc_type":"usermanual", "kw":"Moving a Script or Script Directory,(Optional) Managing Scripts,User Guide", @@ -4496,7 +4604,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4509,7 +4617,7 @@ "uri":"dataartsstudio_01_0428.html", "node_id":"dataartsstudio_01_0428.xml", "product_code":"dataartsstudio", - "code":"215", + "code":"220", "des":"You can export one or more script files from the script directory. The exported files store the latest content in the development state.Log in to the DataArts Studio cons", "doc_type":"usermanual", "kw":"Exporting and Importing Scripts,(Optional) Managing Scripts,User Guide", @@ -4517,7 +4625,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4530,7 +4638,7 @@ "uri":"dataartsstudio_01_0471.html", "node_id":"dataartsstudio_01_0471.xml", "product_code":"dataartsstudio", - "code":"216", + "code":"221", "des":"This section describes how to view the references of a script or all the scripts in a folder.A script has been developed based on Developing Scripts.Log in to the DataArt", "doc_type":"usermanual", "kw":"Viewing Script References,(Optional) Managing Scripts,User Guide", @@ -4538,7 +4646,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4551,15 +4659,15 @@ "uri":"dataartsstudio_01_0429.html", "node_id":"dataartsstudio_01_0429.xml", "product_code":"dataartsstudio", - "code":"217", - "des":"If you do not need to use a script any more, perform the following operations to delete it.When you delete a script, the system checks whether the script is being referen", + "code":"222", + "des":"If you do not need to use a script any longer, perform the following operations to delete it.When you delete a script, the system checks whether the script is being refer", "doc_type":"usermanual", "kw":"Deleting a Script,(Optional) Managing Scripts,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4572,7 +4680,7 @@ "uri":"dataartsstudio_01_0912.html", "node_id":"dataartsstudio_01_0912.xml", "product_code":"dataartsstudio", - "code":"218", + "code":"223", "des":"Script and job unlocking depends on the lock function of DataArts Factory.The lock function prevents conflict caused by collaborative script or job development. If you cr", "doc_type":"usermanual", "kw":"Unlocking a Script,(Optional) Managing Scripts,User Guide", @@ -4580,7 +4688,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4593,7 +4701,7 @@ "uri":"dataartsstudio_01_1102.html", "node_id":"dataartsstudio_01_1102.xml", "product_code":"dataartsstudio", - "code":"219", + "code":"224", "des":"DataArts Factory allows you to change the script owner with a few clicks.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Stu", "doc_type":"usermanual", "kw":"Changing the Script Owner,(Optional) Managing Scripts,User Guide", @@ -4601,7 +4709,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4614,7 +4722,7 @@ "uri":"dataartsstudio_01_1107.html", "node_id":"dataartsstudio_01_1107.xml", "product_code":"dataartsstudio", - "code":"220", + "code":"225", "des":"This section describes how to unlock scripts in batches.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Cons", "doc_type":"usermanual", "kw":"Unlocking Scripts,(Optional) Managing Scripts,User Guide", @@ -4622,7 +4730,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4635,7 +4743,7 @@ "uri":"dataartsstudio_01_0431.html", "node_id":"dataartsstudio_01_0431.xml", "product_code":"dataartsstudio", - "code":"221", + "code":"226", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Job Development", @@ -4643,7 +4751,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4656,7 +4764,7 @@ "uri":"dataartsstudio_01_0432.html", "node_id":"dataartsstudio_01_0432.xml", "product_code":"dataartsstudio", - "code":"222", + "code":"227", "des":"The job development function provides the following capabilities:Provides a graphical designer that allows you to quickly build a data processing workflow by drag-and-dro", "doc_type":"usermanual", "kw":"Job Development Process,Job Development,User Guide", @@ -4664,7 +4772,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4677,15 +4785,15 @@ "uri":"dataartsstudio_01_0434.html", "node_id":"dataartsstudio_01_0434.xml", "product_code":"dataartsstudio", - "code":"223", - "des":"A job is composed of one or more nodes that are performed collaboratively to complete data operations. Before developing a job, create a new one.Each workspace can hold a", + "code":"228", + "des":"A job is composed of one or more nodes that are performed collaboratively to complete data operations. Before developing a job, create a new one.A workspace can contain a", "doc_type":"usermanual", "kw":"Creating a Job,Job Development,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4698,7 +4806,7 @@ "uri":"dataartsstudio_01_0435.html", "node_id":"dataartsstudio_01_0435.xml", "product_code":"dataartsstudio", - "code":"224", + "code":"229", "des":"This section describes how to develop and configure a job.For details about how to develop a batch processing job or real-time processing job in pipeline mode, see Compil", "doc_type":"usermanual", "kw":"Developing a Pipeline Job,Job Development,User Guide", @@ -4706,7 +4814,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4719,7 +4827,7 @@ "uri":"dataartsstudio_01_1436.html", "node_id":"dataartsstudio_01_1436.xml", "product_code":"dataartsstudio", - "code":"225", + "code":"230", "des":"This section describes how to develop and configure a job.For details about how to develop a batch processing job in single-task mode, see sections Developing an SQL Scri", "doc_type":"usermanual", "kw":"Developing a Batch Processing Single-Task SQL Job,Job Development,User Guide", @@ -4727,7 +4835,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4740,57 +4848,57 @@ "uri":"dataartsstudio_01_1823.html", "node_id":"dataartsstudio_01_1823.xml", "product_code":"dataartsstudio", - "code":"226", + "code":"231", "des":"This section describes how to develop and configure a job.For details about how to develop a real-time processing Flink SQL job in single-task mode, see sections Developi", "doc_type":"usermanual", - "kw":"Developing a Real-Time Processing Single-Task Flink SQL Job,Job Development,User Guide", + "kw":"Developing a Real-Time Processing Single-Task MRS Flink SQL Job,Job Development,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Developing a Real-Time Processing Single-Task Flink SQL Job", + "title":"Developing a Real-Time Processing Single-Task MRS Flink SQL Job", "githuburl":"" }, { "uri":"dataartsstudio_01_1824.html", "node_id":"dataartsstudio_01_1824.xml", "product_code":"dataartsstudio", - "code":"227", - "des":"A single-task real-time processing Flink Jar job has been created. For details, see Creating a Job.", + "code":"232", + "des":"A single-task real-time processing Flink Jar job has been created. For details, see Creating a Job.After setting the parameters, click Save and submit the job.Click Start", "doc_type":"usermanual", - "kw":"Developing a Real-Time Processing Single-Task Flink Jar Job,Job Development,User Guide", + "kw":"Developing a Real-Time Processing Single-Task MRS Flink Jar Job,Job Development,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Developing a Real-Time Processing Single-Task Flink Jar Job", + "title":"Developing a Real-Time Processing Single-Task MRS Flink Jar Job", "githuburl":"" }, { "uri":"dataartsstudio_01_1825.html", "node_id":"dataartsstudio_01_1825.xml", "product_code":"dataartsstudio", - "code":"228", - "des":"A single-task real-time processing DLI Spark job has been created. For details, see Creating a Job.", + "code":"233", + "des":"A single-task real-time processing DLI Spark job has been created. For details, see Creating a Job.After setting the parameters, click Save and submit the job.Click Start", "doc_type":"usermanual", "kw":"Developing a Real-Time Processing Single-Task DLI Spark Job,Job Development,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4803,7 +4911,7 @@ "uri":"dataartsstudio_01_0470.html", "node_id":"dataartsstudio_01_0470.xml", "product_code":"dataartsstudio", - "code":"229", + "code":"234", "des":"This section describes how to set up scheduling for an orchestrated job.If the processing mode of a job is batch processing, configure scheduling types for jobs. Three sc", "doc_type":"usermanual", "kw":"Setting Up Scheduling for a Job,Job Development,User Guide", @@ -4811,7 +4919,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4824,7 +4932,7 @@ "uri":"dataartsstudio_01_0902.html", "node_id":"dataartsstudio_01_0902.xml", "product_code":"dataartsstudio", - "code":"230", + "code":"235", "des":"Submitting a version depends on the version management function of DataArts Factory.Version management traces script and job changes, and supports version comparison and ", "doc_type":"usermanual", "kw":"Submitting a Version,Job Development,User Guide", @@ -4832,7 +4940,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4845,15 +4953,15 @@ "uri":"dataartsstudio_01_1903.html", "node_id":"dataartsstudio_01_1903.xml", "product_code":"dataartsstudio", - "code":"231", - "des":"In enterprise mode, when a developer submits a job version, the system generates a job release task. After the developer confirms the release task and the admin, deployer", + "code":"236", + "des":"In enterprise mode, when a developer submits a job version, the system generates a job release task. After the developer confirms releasing a package and the admin, deplo", "doc_type":"usermanual", "kw":"Releasing a Job Task,Job Development,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4866,7 +4974,7 @@ "uri":"dataartsstudio_01_0408.html", "node_id":"dataartsstudio_01_0408.xml", "product_code":"dataartsstudio", - "code":"232", + "code":"237", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"(Optional) Managing Jobs", @@ -4874,7 +4982,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4887,7 +4995,7 @@ "uri":"dataartsstudio_01_0440.html", "node_id":"dataartsstudio_01_0440.xml", "product_code":"dataartsstudio", - "code":"233", + "code":"238", "des":"This section describes how to copy a job.A job has been developed. For details about how to develop a job, see Developing a Pipeline Job.Log in to the DataArts Studio con", "doc_type":"usermanual", "kw":"Copying a Job,(Optional) Managing Jobs,User Guide", @@ -4895,7 +5003,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4908,7 +5016,7 @@ "uri":"dataartsstudio_01_0436.html", "node_id":"dataartsstudio_01_0436.xml", "product_code":"dataartsstudio", - "code":"234", + "code":"239", "des":"You can copy the name of a job and rename a job.A job has been developed. For details about how to develop a job, see Developing a Pipeline Job.Log in to the DataArts Stu", "doc_type":"usermanual", "kw":"Copying the Job Name and Renaming a Job,(Optional) Managing Jobs,User Guide", @@ -4916,7 +5024,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4929,7 +5037,7 @@ "uri":"dataartsstudio_01_0437.html", "node_id":"dataartsstudio_01_0437.xml", "product_code":"dataartsstudio", - "code":"235", + "code":"240", "des":"You can move a job file from one directory to another or move a job directory to another directory.A job has been developed. For details about how to develop a job, see D", "doc_type":"usermanual", "kw":"Moving a Job or Job Directory,(Optional) Managing Jobs,User Guide", @@ -4937,7 +5045,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4950,7 +5058,7 @@ "uri":"dataartsstudio_01_0438.html", "node_id":"dataartsstudio_01_0438.xml", "product_code":"dataartsstudio", - "code":"236", + "code":"241", "des":"Exporting jobs is to export the latest saved content in the development state.After a job is imported, the content in the development state is overwritten and a new versi", "doc_type":"usermanual", "kw":"Exporting and Importing Jobs,(Optional) Managing Jobs,User Guide", @@ -4958,7 +5066,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4971,15 +5079,15 @@ "uri":"dataartsstudio_01_0439.html", "node_id":"dataartsstudio_01_0439.xml", "product_code":"dataartsstudio", - "code":"237", - "des":"If you do not need to use a job any more, perform the following operations to delete it to reduce the quota usage of the job.Deleted jobs cannot be recovered. Exercise ca", + "code":"242", + "des":"If you do not need to use a job any longer, perform the following operations to delete it to reduce the quota usage of the job.Deleted jobs cannot be recovered. Exercise ", "doc_type":"usermanual", "kw":"Deleting a Job,(Optional) Managing Jobs,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -4992,7 +5100,7 @@ "uri":"dataartsstudio_01_0913.html", "node_id":"dataartsstudio_01_0913.xml", "product_code":"dataartsstudio", - "code":"238", + "code":"243", "des":"Script and job unlocking depends on the lock function of DataArts Factory.The lock function prevents conflict caused by collaborative script or job development. If you cr", "doc_type":"usermanual", "kw":"Unlocking a Job,(Optional) Managing Jobs,User Guide", @@ -5000,7 +5108,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5013,7 +5121,7 @@ "uri":"dataartsstudio_01_1097.html", "node_id":"dataartsstudio_01_1097.xml", "product_code":"dataartsstudio", - "code":"239", + "code":"244", "des":"You can view a job dependency graph to learn the upstream and downstream jobs associated with the job.Dependent jobs have been configured in the job scheduling configurat", "doc_type":"usermanual", "kw":"Viewing a Job Dependency Graph,(Optional) Managing Jobs,User Guide", @@ -5021,7 +5129,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5034,7 +5142,7 @@ "uri":"dataartsstudio_01_1101.html", "node_id":"dataartsstudio_01_1101.xml", "product_code":"dataartsstudio", - "code":"240", + "code":"245", "des":"DataArts Factory allows you to change the job owner with a few clicks.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio", "doc_type":"usermanual", "kw":"Changing the Job Owner,(Optional) Managing Jobs,User Guide", @@ -5042,7 +5150,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5055,7 +5163,7 @@ "uri":"dataartsstudio_01_1108.html", "node_id":"dataartsstudio_01_1108.xml", "product_code":"dataartsstudio", - "code":"241", + "code":"246", "des":"This section describes how to unlock jobs in batches.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console", "doc_type":"usermanual", "kw":"Unlocking Jobs,(Optional) Managing Jobs,User Guide", @@ -5063,7 +5171,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5076,7 +5184,7 @@ "uri":"dataartsstudio_01_1209.html", "node_id":"dataartsstudio_01_1209.xml", "product_code":"dataartsstudio", - "code":"242", + "code":"247", "des":"From the job directory tree, you can quickly switch to the job monitoring page to view the monitoring details of the job.Log in to the DataArts Studio console by followin", "doc_type":"usermanual", "kw":"Going to Monitor Job page,(Optional) Managing Jobs,User Guide", @@ -5084,7 +5192,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5093,11 +5201,32 @@ "title":"Going to Monitor Job page", "githuburl":"" }, + { + "uri":"dataartsstudio_01_1210.html", + "node_id":"dataartsstudio_01_1210.xml", + "product_code":"dataartsstudio", + "code":"248", + "des":"You can configure notifications for a job. Right-click a job name and select Configure Notification. For details, see Configuring Notifications.To modify existing notific", + "doc_type":"usermanual", + "kw":"Configuring Notifications,(Optional) Managing Jobs,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"Configuring Notifications", + "githuburl":"" + }, { "uri":"dataartsstudio_01_0503.html", "node_id":"dataartsstudio_01_0503.xml", "product_code":"dataartsstudio", - "code":"243", + "code":"249", "des":"The solution aims to provide users with convenient and systematic management operations and better meet service requirements and objectives. Each solution can contain one", "doc_type":"usermanual", "kw":"Solution,DataArts Factory,User Guide", @@ -5105,7 +5234,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5118,7 +5247,7 @@ "uri":"dataartsstudio_01_1105.html", "node_id":"dataartsstudio_01_1105.xml", "product_code":"dataartsstudio", - "code":"244", + "code":"250", "des":"This section describes how to view the execution history of scripts, jobs, and nodes over a week.This function depends on OBS buckets. For details about how to configure ", "doc_type":"usermanual", "kw":"Execution History,DataArts Factory,User Guide", @@ -5126,7 +5255,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5139,7 +5268,7 @@ "uri":"dataartsstudio_01_0505.html", "node_id":"dataartsstudio_01_0505.xml", "product_code":"dataartsstudio", - "code":"245", + "code":"251", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"O&M and Scheduling", @@ -5147,7 +5276,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5160,7 +5289,7 @@ "uri":"dataartsstudio_01_0506.html", "node_id":"dataartsstudio_01_0506.xml", "product_code":"dataartsstudio", - "code":"246", + "code":"252", "des":"Choose Monitoring > Overview. On the Overview page, you can view the statistics of job instances in charts. Currently, you can view seven types of statistics:StatusYou ca", "doc_type":"usermanual", "kw":"Overview,O&M and Scheduling,User Guide", @@ -5168,7 +5297,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5181,7 +5310,7 @@ "uri":"dataartsstudio_01_0413.html", "node_id":"dataartsstudio_01_0413.xml", "product_code":"dataartsstudio", - "code":"247", + "code":"253", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Monitoring a Job", @@ -5189,7 +5318,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5202,7 +5331,7 @@ "uri":"dataartsstudio_01_0508.html", "node_id":"dataartsstudio_01_0508.xml", "product_code":"dataartsstudio", - "code":"248", + "code":"254", "des":"In the batch processing mode, data is processed periodically in batches based on the job-level scheduling plan, which is used in scenarios with low real-time requirements", "doc_type":"usermanual", "kw":"Monitoring a Batch Job,Monitoring a Job,User Guide", @@ -5210,7 +5339,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5223,7 +5352,7 @@ "uri":"dataartsstudio_01_0509.html", "node_id":"dataartsstudio_01_0509.xml", "product_code":"dataartsstudio", - "code":"249", + "code":"255", "des":"In the real-time processing mode, data is processed in real time, which is used in scenarios with high real-time performance. This type of job is a pipeline that consists", "doc_type":"usermanual", "kw":"Monitoring a Real-Time Job,Monitoring a Job,User Guide", @@ -5231,7 +5360,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5244,7 +5373,7 @@ "uri":"dataartsstudio_01_0511.html", "node_id":"dataartsstudio_01_0511.xml", "product_code":"dataartsstudio", - "code":"250", + "code":"256", "des":"Each time a job is executed, a job instance record is generated. In the navigation pane of the DataArts Factory console, choose Monitoring. On the Monitor Instance page, ", "doc_type":"usermanual", "kw":"Instance Monitoring,O&M and Scheduling,User Guide", @@ -5252,7 +5381,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5265,7 +5394,7 @@ "uri":"dataartsstudio_01_0512.html", "node_id":"dataartsstudio_01_0512.xml", "product_code":"dataartsstudio", - "code":"251", + "code":"257", "des":"In the navigation tree of the DataArts Factory console, choose MonitoringMonitor PatchData.On the PatchData Monitoring page, you can view the PatchData job status, date, ", "doc_type":"usermanual", "kw":"Monitoring PatchData,O&M and Scheduling,User Guide", @@ -5273,7 +5402,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5286,36 +5415,36 @@ "uri":"dataartsstudio_01_0414.html", "node_id":"dataartsstudio_01_0414.xml", "product_code":"dataartsstudio", - "code":"252", + "code":"258", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"Managing Notifications", + "kw":"Notification Management", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"Managing Notifications", + "title":"Notification Management", "githuburl":"" }, { "uri":"dataartsstudio_01_0514.html", "node_id":"dataartsstudio_01_0514.xml", "product_code":"dataartsstudio", - "code":"253", + "code":"259", "des":"You can configure job notification tasks to notify you of job success or failures.Before configuring a notification for a job:Message notification has been enabled and a ", "doc_type":"usermanual", - "kw":"Managing Notifications,Managing Notifications,User Guide", + "kw":"Managing Notifications,Notification Management,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5328,15 +5457,15 @@ "uri":"dataartsstudio_01_0515.html", "node_id":"dataartsstudio_01_0515.xml", "product_code":"dataartsstudio", - "code":"254", + "code":"260", "des":"Notifications can be set to specified personnel by day, week, or month, allowing related personnel to regularly understand job scheduling information about the quantity o", "doc_type":"usermanual", - "kw":"Cycle Overview,Managing Notifications,User Guide", + "kw":"Cycle Overview,Notification Management,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5345,32 +5474,11 @@ "title":"Cycle Overview", "githuburl":"" }, - { - "uri":"dataartsstudio_01_2515.html", - "node_id":"dataartsstudio_01_2515.xml", - "product_code":"dataartsstudio", - "code":"255", - "des":"You can configure terminal subscriptions (SMS messages, emails, and phone calls) by owner. After configuring a subscription, you can use the Manage Notification function ", - "doc_type":"usermanual", - "kw":"Managing Terminal Subscriptions,Managing Notifications,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Managing Terminal Subscriptions", - "githuburl":"" - }, { "uri":"dataartsstudio_01_0516.html", "node_id":"dataartsstudio_01_0516.xml", "product_code":"dataartsstudio", - "code":"256", + "code":"261", "des":"You can back up all jobs, scripts, resources, and environment variables at a specified interval.You can also restore assets that have been backed up, including jobs, scri", "doc_type":"usermanual", "kw":"Managing Backups,O&M and Scheduling,User Guide", @@ -5378,7 +5486,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5391,7 +5499,7 @@ "uri":"dataartsstudio_01_1822.html", "node_id":"dataartsstudio_01_1822.xml", "product_code":"dataartsstudio", - "code":"257", + "code":"262", "des":"You can view historical operations on the Operation History page. The system stores data for a maximum of three months and automatically deletes older data.Log in to the ", "doc_type":"usermanual", "kw":"Operation History,O&M and Scheduling,User Guide", @@ -5399,7 +5507,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5412,7 +5520,7 @@ "uri":"dataartsstudio_01_0517.html", "node_id":"dataartsstudio_01_0517.xml", "product_code":"dataartsstudio", - "code":"258", + "code":"263", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Configuration and Management", @@ -5420,7 +5528,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5433,7 +5541,7 @@ "uri":"dataartsstudio_01_0510.html", "node_id":"dataartsstudio_01_0510.xml", "product_code":"dataartsstudio", - "code":"259", + "code":"264", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Configuring Resources", @@ -5441,7 +5549,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5454,7 +5562,7 @@ "uri":"dataartsstudio_01_0504.html", "node_id":"dataartsstudio_01_0504.xml", "product_code":"dataartsstudio", - "code":"260", + "code":"265", "des":"This topic describes how to configure and use environment variables.Configure job parameters. If a parameter belongs to multiple jobs, you can extract this parameter as a", "doc_type":"usermanual", "kw":"Configuring Environment Variables,Configuring Resources,User Guide", @@ -5462,7 +5570,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5475,7 +5583,7 @@ "uri":"dataartsstudio_01_1106.html", "node_id":"dataartsstudio_01_1106.xml", "product_code":"dataartsstudio", - "code":"261", + "code":"266", "des":"The execution history of scripts, jobs, and nodes is stored in OBS buckets. If no OBS bucket is available, you cannot view the execution history. This section describes h", "doc_type":"usermanual", "kw":"Configuring an OBS Bucket,Configuring Resources,User Guide", @@ -5483,7 +5591,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5496,7 +5604,7 @@ "uri":"dataartsstudio_01_0532.html", "node_id":"dataartsstudio_01_0532.xml", "product_code":"dataartsstudio", - "code":"262", + "code":"267", "des":"Job tags are used to label jobs of the same or similar purposes to facilitate job management and query. This section describes how to manage job tags, including adding, d", "doc_type":"usermanual", "kw":"Managing Job Tags,Configuring Resources,User Guide", @@ -5504,7 +5612,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5517,7 +5625,7 @@ "uri":"dataartsstudio_01_0555.html", "node_id":"dataartsstudio_01_0555.xml", "product_code":"dataartsstudio", - "code":"263", + "code":"268", "des":"The following problems may occur during job execution in DataArts Factory:The job execution mechanism of the DataArts Factory module is to execute the job as the user who", "doc_type":"usermanual", "kw":"Configuring a Scheduling Identity,Configuring Resources,User Guide", @@ -5525,7 +5633,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5538,7 +5646,7 @@ "uri":"dataartsstudio_01_1280.html", "node_id":"dataartsstudio_01_1280.xml", "product_code":"dataartsstudio", - "code":"264", + "code":"269", "des":"This section describes how to configure the maximum number of job nodes that can run concurrently in a workspace.The number of concurrently running nodes in the workspace", "doc_type":"usermanual", "kw":"Configuring the Number of Concurrently Running Nodes,Configuring Resources,User Guide", @@ -5546,7 +5654,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5559,15 +5667,15 @@ "uri":"dataartsstudio_01_1282.html", "node_id":"dataartsstudio_01_1282.xml", "product_code":"dataartsstudio", - "code":"265", - "des":"This section describes how to create and use a Flink SQL template. When writing Flink SQL code, you can use an SQL template for repeated service logic. In addition, you c", + "code":"270", + "des":"This section describes how to create and use a template. When writing code, you can use an SQL template for repeated service logic. In addition, you can use a job paramet", "doc_type":"usermanual", "kw":"Configuring a Template,Configuring Resources,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5580,15 +5688,15 @@ "uri":"dataartsstudio_01_1283.html", "node_id":"dataartsstudio_01_1283.xml", "product_code":"dataartsstudio", - "code":"266", - "des":"You can configure a scheduling calendar and specify the working days for scheduling a job.This function is available for batch processing jobs but not for real-time proce", + "code":"271", + "des":"You can configure a scheduling calendar and specify the working days for scheduling a job.After creating a scheduling calendar, you can go to the DataArts Factory console", "doc_type":"usermanual", "kw":"Configuring a Scheduling Calendar,Configuring Resources,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5601,7 +5709,7 @@ "uri":"dataartsstudio_01_04501.html", "node_id":"dataartsstudio_01_04501.xml", "product_code":"dataartsstudio", - "code":"267", + "code":"272", "des":"This section describes how to configure a default item. You can perform the operations in this section only if you have the permissions of DARTS Administrator or Tenant A", "doc_type":"usermanual", "kw":"Configuring a Default Item,Configuring Resources,User Guide", @@ -5609,7 +5717,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5622,7 +5730,7 @@ "uri":"dataartsstudio_01_1284.html", "node_id":"dataartsstudio_01_1284.xml", "product_code":"dataartsstudio", - "code":"268", + "code":"273", "des":"By configuring a task group, you can control the maximum number of concurrent nodes in a task group in a more fine-grained manner.This function is available only for batc", "doc_type":"usermanual", "kw":"Configuring Task Groups,Configuring Resources,User Guide", @@ -5630,7 +5738,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5643,7 +5751,7 @@ "uri":"dataartsstudio_01_0519.html", "node_id":"dataartsstudio_01_0519.xml", "product_code":"dataartsstudio", - "code":"269", + "code":"274", "des":"You can upload custom code or text files as resources on Manage Resource and schedule them when running nodes. Nodes that can invoke resources include DLI Spark, MRS Spar", "doc_type":"usermanual", "kw":"Managing Resources,Configuration and Management,User Guide", @@ -5651,7 +5759,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5664,15 +5772,15 @@ "uri":"dataartsstudio_01_1820.html", "node_id":"dataartsstudio_01_1820.xml", "product_code":"dataartsstudio", - "code":"270", - "des":"For a workspace in simple mode, you can set the reviewer for the scripts and jobs you submit.Only the admin of the current workspace can manage reviewers, including creat", + "code":"275", + "des":"For a workspace in simple mode, you can set the reviewer for the scripts and jobs you submit. In the review center, you can manage applications and configure and maintain", "doc_type":"usermanual", "kw":"Review Center,DataArts Factory,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5685,7 +5793,7 @@ "uri":"dataartsstudio_01_1821.html", "node_id":"dataartsstudio_01_1821.xml", "product_code":"dataartsstudio", - "code":"271", + "code":"276", "des":"You can download or dump SQL script execution results. After downloading or dumping the SQL execution results, you can view them on the Download Center page.Records are g", "doc_type":"usermanual", "kw":"Download Center,DataArts Factory,User Guide", @@ -5693,7 +5801,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5706,7 +5814,7 @@ "uri":"dataartsstudio_01_0441.html", "node_id":"dataartsstudio_01_0441.xml", "product_code":"dataartsstudio", - "code":"272", + "code":"277", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Node Reference", @@ -5714,7 +5822,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5727,7 +5835,7 @@ "uri":"dataartsstudio_01_0442.html", "node_id":"dataartsstudio_01_0442.xml", "product_code":"dataartsstudio", - "code":"273", + "code":"278", "des":"A node defines the operations performed on data. DataArts Factory provides nodes used for data integration, computing and analysis, database operations, and resource mana", "doc_type":"usermanual", "kw":"Node Overview,Node Reference,User Guide", @@ -5735,7 +5843,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5748,7 +5856,7 @@ "uri":"dataartsstudio_01_0443.html", "node_id":"dataartsstudio_01_0443.xml", "product_code":"dataartsstudio", - "code":"274", + "code":"279", "des":"The CDM Job node is used to run a predefined CDM job for data migration.If you have configured a macro variable of date and time in a CDM job and schedule the CDM job thr", "doc_type":"usermanual", "kw":"CDM Job,Node Reference,User Guide", @@ -5756,7 +5864,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5769,7 +5877,7 @@ "uri":"dataartsstudio_01_0447.html", "node_id":"dataartsstudio_01_0447.xml", "product_code":"dataartsstudio", - "code":"275", + "code":"280", "des":"The Rest Client node is used to respond to RESTful requests in cloud.For details about how to use the Rest Client operator, see Obtaining the Return Value of a Rest Clien", "doc_type":"usermanual", "kw":"Rest Client,Node Reference,User Guide", @@ -5777,7 +5885,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5790,7 +5898,7 @@ "uri":"dataartsstudio_01_0448.html", "node_id":"dataartsstudio_01_0448.xml", "product_code":"dataartsstudio", - "code":"276", + "code":"281", "des":"The Import GES node is used to import files from an OBS bucket to a GES graph.Table 1 and Table 2 describe the parameters of the Import GES node.", "doc_type":"usermanual", "kw":"Import GES,Node Reference,User Guide", @@ -5798,7 +5906,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5811,7 +5919,7 @@ "uri":"dataartsstudio_01_0537.html", "node_id":"dataartsstudio_01_0537.xml", "product_code":"dataartsstudio", - "code":"277", + "code":"282", "des":"The MRS Kafka node is used to query the number of messages that are not consumed by a topic.Table 1 and Table 2 describe the parameters of the MRS Kafka node.", "doc_type":"usermanual", "kw":"MRS Kafka,Node Reference,User Guide", @@ -5819,7 +5927,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5832,7 +5940,7 @@ "uri":"dataartsstudio_01_0538.html", "node_id":"dataartsstudio_01_0538.xml", "product_code":"dataartsstudio", - "code":"278", + "code":"283", "des":"The Kafka Client node is used to send data to Kafka topics.You can learn more about how to use the Kafka Client node in .Table 1 describes the parameters of the Kafka Cli", "doc_type":"usermanual", "kw":"Kafka Client,Node Reference,User Guide", @@ -5840,7 +5948,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5853,7 +5961,7 @@ "uri":"dataartsstudio_01_1098.html", "node_id":"dataartsstudio_01_1098.xml", "product_code":"dataartsstudio", - "code":"279", + "code":"284", "des":"The ROMA FDI Job node executes a predefined ROMA Connect data integration task to implement data integration and conversion between the source and destination.This node e", "doc_type":"usermanual", "kw":"ROMA FDI Job,Node Reference,User Guide", @@ -5861,7 +5969,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5874,36 +5982,36 @@ "uri":"dataartsstudio_01_0536.html", "node_id":"dataartsstudio_01_0536.xml", "product_code":"dataartsstudio", - "code":"280", + "code":"285", "des":"The DLI Flink Job node is used to create and start jobs or check whether DLI jobs are running to analyze streaming big data in real time.After a DLI Flink streaming job i", "doc_type":"usermanual", - "kw":"DLI Flink Job,Node Reference,User Guide", + "kw":"DLI Flink Job,Node Reference,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"DLI Flink Job", + "title":"DLI Flink Job", "githuburl":"" }, { "uri":"dataartsstudio_01_0450.html", "node_id":"dataartsstudio_01_0450.xml", "product_code":"dataartsstudio", - "code":"281", - "des":"The DLI SQL node is used to transfer SQL statements to DLI for data source analysis and exploration.This node enables you to execute DLI statements during periodical or r", + "code":"286", + "des":"The DLI SQL node is used to transfer SQL statements to DLI SQL for data source analysis and exploration.This node enables you to execute DLI statements during periodical ", "doc_type":"usermanual", "kw":"DLI SQL,Node Reference,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5916,7 +6024,7 @@ "uri":"dataartsstudio_01_0451.html", "node_id":"dataartsstudio_01_0451.xml", "product_code":"dataartsstudio", - "code":"282", + "code":"287", "des":"The DLI Spark node is used to execute a predefined Spark job.For details about how to use the DLI Spark node, see Developing a DLI Spark Job.Table 1, Table 2, and Table 3", "doc_type":"usermanual", "kw":"DLI Spark,Node Reference,User Guide", @@ -5924,7 +6032,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5937,7 +6045,7 @@ "uri":"dataartsstudio_01_0452.html", "node_id":"dataartsstudio_01_0452.xml", "product_code":"dataartsstudio", - "code":"283", + "code":"288", "des":"The DWS SQL node is used to transfer SQL statements to DWS.For details about how to use the DWS SQL operator, see Developing a DWS SQL Job.This node enables you to execut", "doc_type":"usermanual", "kw":"DWS SQL,Node Reference,User Guide", @@ -5945,7 +6053,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5958,7 +6066,7 @@ "uri":"dataartsstudio_01_0453.html", "node_id":"dataartsstudio_01_0453.xml", "product_code":"dataartsstudio", - "code":"284", + "code":"289", "des":"The MRS Spark SQL node is used to execute a predefined SparkSQL statement on MRS.Table 1, Table 2, and Table 3 describe the parameters of the MRS Spark SQLnode node.", "doc_type":"usermanual", "kw":"MRS Spark SQL,Node Reference,User Guide", @@ -5966,7 +6074,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -5979,7 +6087,7 @@ "uri":"dataartsstudio_01_0454.html", "node_id":"dataartsstudio_01_0454.xml", "product_code":"dataartsstudio", - "code":"285", + "code":"290", "des":"The MRS Hive SQL node is used to execute a predefined Hive SQL script in DataArts Factory.For details about how to use the MRS Hive SQL node, see Developing a Hive SQL Jo", "doc_type":"usermanual", "kw":"MRS Hive SQL,Node Reference,User Guide", @@ -5987,7 +6095,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6000,7 +6108,7 @@ "uri":"dataartsstudio_01_1099.html", "node_id":"dataartsstudio_01_1099.xml", "product_code":"dataartsstudio", - "code":"286", + "code":"291", "des":"The MRS Presto SQL node is used to execute the Presto SQL script predefined in DataArts Factory.Table 1, Table 2, and Table 3 describe the parameters of the MRS Presto SQ", "doc_type":"usermanual", "kw":"MRS Presto SQL,Node Reference,User Guide", @@ -6008,7 +6116,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6021,7 +6129,7 @@ "uri":"dataartsstudio_01_0455.html", "node_id":"dataartsstudio_01_0455.xml", "product_code":"dataartsstudio", - "code":"287", + "code":"292", "des":"The MRS Spark node is used to execute a predefined Spark job on MRS.Table 1, Table 2, and Table 3 describe the parameters of the MRS Sparknode node.", "doc_type":"usermanual", "kw":"MRS Spark,Node Reference,User Guide", @@ -6029,7 +6137,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6042,7 +6150,7 @@ "uri":"dataartsstudio_01_0456.html", "node_id":"dataartsstudio_01_0456.xml", "product_code":"dataartsstudio", - "code":"288", + "code":"293", "des":"The MRS Spark Python node is used to execute a predefined Spark Python job on MRS.For details about how to use the MRS Spark Python operator, see Developing an MRS Spark ", "doc_type":"usermanual", "kw":"MRS Spark Python,Node Reference,User Guide", @@ -6050,7 +6158,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6059,11 +6167,53 @@ "title":"MRS Spark Python", "githuburl":"" }, + { + "uri":"dataartsstudio_01_0528.html", + "node_id":"dataartsstudio_01_0528.xml", + "product_code":"dataartsstudio", + "code":"294", + "des":"The MRS ClickHouse node is used to execute the ClickHouse SQL script predefined in DataArts Factory.Table 1, Table 2, and Table 3 describe the parameters of the MRS Click", + "doc_type":"usermanual", + "kw":"MRS ClickHouse,Node Reference,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"MRS ClickHouse", + "githuburl":"" + }, + { + "uri":"dataartsstudio_01_1104.html", + "node_id":"dataartsstudio_01_1104.xml", + "product_code":"dataartsstudio", + "code":"295", + "des":"The MRS Impala SQL node is used to execute the Impala SQL script predefined in DataArts Factory.Table 1 and Table 2 describe the parameters of the MRS Impala node.", + "doc_type":"usermanual", + "kw":"MRS Impala SQL,Node Reference,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"MRS Impala SQL", + "githuburl":"" + }, { "uri":"dataartsstudio_01_0554.html", "node_id":"dataartsstudio_01_0554.xml", "product_code":"dataartsstudio", - "code":"289", + "code":"296", "des":"The MRS Flink Job node is used to execute the Flink SQL script and Flink job predefined in DataArts Factory.Table 1 and Table 2 describe the parameters of the MRS Flink n", "doc_type":"usermanual", "kw":"MRS Flink Job,Node Reference,User Guide", @@ -6071,7 +6221,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6084,7 +6234,7 @@ "uri":"dataartsstudio_01_0457.html", "node_id":"dataartsstudio_01_0457.xml", "product_code":"dataartsstudio", - "code":"290", + "code":"297", "des":"The MRS MapReduce node is used to execute a predefined MapReduce program on MRS.Table 1 and Table 2 describe the parameters of the MRS MapReduce node.", "doc_type":"usermanual", "kw":"MRS MapReduce,Node Reference,User Guide", @@ -6092,7 +6242,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6105,7 +6255,7 @@ "uri":"dataartsstudio_01_0458.html", "node_id":"dataartsstudio_01_0458.xml", "product_code":"dataartsstudio", - "code":"291", + "code":"298", "des":"The CSS node is used to process CSS requests and enable online distributed searching.Table 1 and Table 2 describe the parameters of the CSS node.", "doc_type":"usermanual", "kw":"CSS,Node Reference,User Guide", @@ -6113,7 +6263,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6126,7 +6276,7 @@ "uri":"dataartsstudio_01_0459.html", "node_id":"dataartsstudio_01_0459.xml", "product_code":"dataartsstudio", - "code":"292", + "code":"299", "des":"The Shell node is used to execute a shell script.With EL expression #{Job.getNodeOutput()}, you can obtain the desired content (4000 characters at most and counted backwa", "doc_type":"usermanual", "kw":"Shell,Node Reference,User Guide", @@ -6134,7 +6284,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6147,7 +6297,7 @@ "uri":"dataartsstudio_01_0460.html", "node_id":"dataartsstudio_01_0460.xml", "product_code":"dataartsstudio", - "code":"293", + "code":"300", "des":"The RDS SQL node is used to transfer SQL statements to RDS.Table 1 and Table 2 describe the parameters of the RDS SQL node.", "doc_type":"usermanual", "kw":"RDS SQL,Node Reference,User Guide", @@ -6155,7 +6305,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6168,7 +6318,7 @@ "uri":"dataartsstudio_01_0461.html", "node_id":"dataartsstudio_01_0461.xml", "product_code":"dataartsstudio", - "code":"294", + "code":"301", "des":"The ETL Job node is used to extract data from a specified data source, preprocess the data, and import the data to the target data source.The destination is the ETL Job n", "doc_type":"usermanual", "kw":"ETL Job,Node Reference,User Guide", @@ -6176,7 +6326,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6189,7 +6339,7 @@ "uri":"dataartsstudio_01_4504.html", "node_id":"dataartsstudio_01_4504.xml", "product_code":"dataartsstudio", - "code":"295", + "code":"302", "des":"Before using a Python node, ensure that the host connected to the node has an environment for executing Python scripts.The Python node is used to execute Python statement", "doc_type":"usermanual", "kw":"Python,Node Reference,User Guide", @@ -6197,7 +6347,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6206,11 +6356,32 @@ "title":"Python", "githuburl":"" }, + { + "uri":"dataartsstudio_01_4509.html", + "node_id":"dataartsstudio_01_4509.xml", + "product_code":"dataartsstudio", + "code":"303", + "des":"The Doris SQL node transfers SQL statements to Doris for execution.Table 1 and Table 2 describe the parameters of the Doris SQL node.", + "doc_type":"usermanual", + "kw":"DORIS SQL,Node Reference,User Guide", + "search_title":"", + "metedata":[ + { + "opensource":"false;true", + "IsBot":"No;yes;Yes", + "IsMulti":"No;no", + "documenttype":"usermanual", + "prodname":"dataartsstudio" + } + ], + "title":"DORIS SQL", + "githuburl":"" + }, { "uri":"dataartsstudio_01_4500.html", "node_id":"dataartsstudio_01_4500.xml", "product_code":"dataartsstudio", - "code":"296", + "code":"304", "des":"You can orchestrate ModelArts Train operators to schedule the ModelArts workflow in DataArts Studio.Table 1 and Table 2 describe the parameters of the ModelArts Train nod", "doc_type":"usermanual", "kw":"ModelArts Train,Node Reference,User Guide", @@ -6218,7 +6389,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6227,32 +6398,11 @@ "title":"ModelArts Train", "githuburl":"" }, - { - "uri":"dataartsstudio_01_0489.html", - "node_id":"dataartsstudio_01_0489.xml", - "product_code":"dataartsstudio", - "code":"297", - "des":"Http Trigger is a cross-platform scheduling trigger node of DataArts Studio. If you want to trigger a job on DataArts Studio after a job on another scheduling system is c", - "doc_type":"usermanual", - "kw":"Http Trigger,Node Reference,User Guide", - "search_title":"", - "metedata":[ - { - "opensource":"false;true", - "IsBot":"No;yes", - "IsMulti":"No;no", - "documenttype":"usermanual", - "prodname":"dataartsstudio" - } - ], - "title":"Http Trigger", - "githuburl":"" - }, { "uri":"dataartsstudio_01_0462.html", "node_id":"dataartsstudio_01_0462.xml", "product_code":"dataartsstudio", - "code":"298", + "code":"305", "des":"The OBS path cannot be a log path starting with s3a://.This function depends on OBS.The Create OBS node is used to create buckets and directories on OBS.Table 1 and Table", "doc_type":"usermanual", "kw":"Create OBS,Node Reference,User Guide", @@ -6260,7 +6410,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6273,7 +6423,7 @@ "uri":"dataartsstudio_01_0463.html", "node_id":"dataartsstudio_01_0463.xml", "product_code":"dataartsstudio", - "code":"299", + "code":"306", "des":"This function depends on OBS.The Delete OBS node is used to delete a bucket or directory on OBS.Table 1 and Table 2 describe the parameters of the Delete OBS node.", "doc_type":"usermanual", "kw":"Delete OBS,Node Reference,User Guide", @@ -6281,7 +6431,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6294,7 +6444,7 @@ "uri":"dataartsstudio_01_0464.html", "node_id":"dataartsstudio_01_0464.xml", "product_code":"dataartsstudio", - "code":"300", + "code":"307", "des":"This function depends on OBS.The OBS Manager node is used to move or copy files from an OBS bucket to a specified directory.Table 1, Table 2, and Table 3 describe the par", "doc_type":"usermanual", "kw":"OBS Manager,Node Reference,User Guide", @@ -6302,7 +6452,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6315,15 +6465,15 @@ "uri":"dataartsstudio_01_0465.html", "node_id":"dataartsstudio_01_0465.xml", "product_code":"dataartsstudio", - "code":"301", - "des":"You can use the Open/Close Resource node to enable or disable cloud services as required.Table 1 and Table 2 describe the parameters of the Open/Close Resource node.", + "code":"308", + "des":"You can use the Open/Close Resource node to enable or disable services as required.Table 1 and Table 2 describe the parameters of the Open/Close Resource node.", "doc_type":"usermanual", "kw":"Open/Close Resource,Node Reference,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6336,7 +6486,7 @@ "uri":"dataartsstudio_01_0467.html", "node_id":"dataartsstudio_01_0467.xml", "product_code":"dataartsstudio", - "code":"302", + "code":"309", "des":"The Subjob node is used to call the batch job that does not contain the subjob node.Table 1 and Table 2 describe the parameters of the Subjob node.", "doc_type":"usermanual", "kw":"Subjob,Node Reference,User Guide", @@ -6344,7 +6494,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6357,7 +6507,7 @@ "uri":"dataartsstudio_01_0535.html", "node_id":"dataartsstudio_01_0535.xml", "product_code":"dataartsstudio", - "code":"303", + "code":"310", "des":"The For Each node specifies a subjob to be executed cyclically and assigns values to variables in a subjob with a dataset.When a For Each node is executed once, a specifi", "doc_type":"usermanual", "kw":"For Each,Node Reference,User Guide", @@ -6365,7 +6515,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6378,7 +6528,7 @@ "uri":"dataartsstudio_01_0468.html", "node_id":"dataartsstudio_01_0468.xml", "product_code":"dataartsstudio", - "code":"304", + "code":"311", "des":"The SMN node is used to send notifications to users.Table 1 and Table 2 describe the parameters of the SMN node.", "doc_type":"usermanual", "kw":"SMN,Node Reference,User Guide", @@ -6386,7 +6536,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6399,7 +6549,7 @@ "uri":"dataartsstudio_01_0469.html", "node_id":"dataartsstudio_01_0469.xml", "product_code":"dataartsstudio", - "code":"305", + "code":"312", "des":"The Dummy node is empty and does not perform any operations. It is used to simplify the complex connection relationships of nodes. Figure 1 shows an example.Table 1 descr", "doc_type":"usermanual", "kw":"Dummy,Node Reference,User Guide", @@ -6407,7 +6557,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6420,7 +6570,7 @@ "uri":"dataartsstudio_01_0493.html", "node_id":"dataartsstudio_01_0493.xml", "product_code":"dataartsstudio", - "code":"306", + "code":"313", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"EL Expression Reference", @@ -6428,7 +6578,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6441,7 +6591,7 @@ "uri":"dataartsstudio_01_0494.html", "node_id":"dataartsstudio_01_0494.xml", "product_code":"dataartsstudio", - "code":"307", + "code":"314", "des":"Node parameter values in a DataArts Factory job can be dynamically generated based on the running environment by using Expression Language (EL). You can determine whether", "doc_type":"usermanual", "kw":"Expression Overview,EL Expression Reference,User Guide", @@ -6449,7 +6599,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6462,7 +6612,7 @@ "uri":"dataartsstudio_01_0495.html", "node_id":"dataartsstudio_01_0495.xml", "product_code":"dataartsstudio", - "code":"308", + "code":"315", "des":"EL supports most of the arithmetic and logic operators provided by Java.If variable a is empty, default is returned. If variable a is not empty, a itself is returned. The", "doc_type":"usermanual", "kw":"Basic Operators,EL Expression Reference,User Guide", @@ -6470,7 +6620,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6483,7 +6633,7 @@ "uri":"dataartsstudio_01_0496.html", "node_id":"dataartsstudio_01_0496.xml", "product_code":"dataartsstudio", - "code":"309", + "code":"316", "des":"The date and time in the EL expression can be displayed in a user-specified format. The date and time format is specified by the date and time mode character string. The ", "doc_type":"usermanual", "kw":"Date and Time Mode,EL Expression Reference,User Guide", @@ -6491,7 +6641,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6504,7 +6654,7 @@ "uri":"dataartsstudio_01_0497.html", "node_id":"dataartsstudio_01_0497.xml", "product_code":"dataartsstudio", - "code":"310", + "code":"317", "des":"An Env embedded object provides a method of obtaining an environment variable value.The EL expression used to obtain the value of environment variable test is as follows:", "doc_type":"usermanual", "kw":"Env Embedded Objects,EL Expression Reference,User Guide", @@ -6512,7 +6662,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6525,7 +6675,7 @@ "uri":"dataartsstudio_01_0498.html", "node_id":"dataartsstudio_01_0498.xml", "product_code":"dataartsstudio", - "code":"311", + "code":"318", "des":"A job object provides properties and methods of obtaining the output message, job scheduling plan time, and job execution time of the previous node in a job.The expressio", "doc_type":"usermanual", "kw":"Job Embedded Objects,EL Expression Reference,User Guide", @@ -6533,7 +6683,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6546,7 +6696,7 @@ "uri":"dataartsstudio_01_0499.html", "node_id":"dataartsstudio_01_0499.xml", "product_code":"dataartsstudio", - "code":"312", + "code":"319", "des":"A StringUtil embedded object provides methods of operating character strings, for example, truncating a substring from a character string.StringUtil is implemented throug", "doc_type":"usermanual", "kw":"StringUtil Embedded Objects,EL Expression Reference,User Guide", @@ -6554,7 +6704,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6567,7 +6717,7 @@ "uri":"dataartsstudio_01_0500.html", "node_id":"dataartsstudio_01_0500.xml", "product_code":"dataartsstudio", - "code":"313", + "code":"320", "des":"A DateUtil embedded object provides methods of formatting time and calculating time.The previous day of the job scheduling plan time is used as the subdirectory name to g", "doc_type":"usermanual", "kw":"DateUtil Embedded Objects,EL Expression Reference,User Guide", @@ -6575,7 +6725,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6588,7 +6738,7 @@ "uri":"dataartsstudio_01_0501.html", "node_id":"dataartsstudio_01_0501.xml", "product_code":"dataartsstudio", - "code":"314", + "code":"321", "des":"A JSONUtil embedded object provides JSON object methods.The content of variable str is as follows:The expression for obtaining the area code of city1 is as follows:", "doc_type":"usermanual", "kw":"JSONUtil Embedded Objects,EL Expression Reference,User Guide", @@ -6596,7 +6746,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6609,7 +6759,7 @@ "uri":"dataartsstudio_01_0534.html", "node_id":"dataartsstudio_01_0534.xml", "product_code":"dataartsstudio", - "code":"315", + "code":"322", "des":"You can use Loop embedded objects to obtain data from the For Each node.To obtain the second value of a row that is being processed, use the following EL expression:", "doc_type":"usermanual", "kw":"Loop Embedded Objects,EL Expression Reference,User Guide", @@ -6617,7 +6767,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6630,7 +6780,7 @@ "uri":"dataartsstudio_01_0553.html", "node_id":"dataartsstudio_01_0553.xml", "product_code":"dataartsstudio", - "code":"316", + "code":"323", "des":"The OBSUtil embedded objects provide a series of OBS operation methods, for example, checking whether an OBS file or directory exists.The following is the EL expression f", "doc_type":"usermanual", "kw":"OBSUtil Embedded Objects,EL Expression Reference,User Guide", @@ -6638,7 +6788,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6651,7 +6801,7 @@ "uri":"dataartsstudio_01_4803.html", "node_id":"dataartsstudio_01_4803.xml", "product_code":"dataartsstudio", - "code":"317", + "code":"324", "des":"This section describes common EL expressions and examples.", "doc_type":"usermanual", "kw":"Examples of Common EL Expressions,EL Expression Reference,User Guide", @@ -6659,7 +6809,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6672,7 +6822,7 @@ "uri":"dataartsstudio_01_0502.html", "node_id":"dataartsstudio_01_0502.xml", "product_code":"dataartsstudio", - "code":"318", + "code":"325", "des":"With this example, you can understand how to use EL expressions in the following applications:Using variables in the SQL script of DataArts FactoryTransferring parameters", "doc_type":"usermanual", "kw":"EL Expression Use Examples,EL Expression Reference,User Guide", @@ -6680,7 +6830,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6693,7 +6843,7 @@ "uri":"dataartsstudio_01_0556.html", "node_id":"dataartsstudio_01_0556.xml", "product_code":"dataartsstudio", - "code":"319", + "code":"326", "des":"The simple variable set provides a series of customized variables. Customized parameters are automatically replaced with specific values based on the service date, plan t", "doc_type":"usermanual", "kw":"Simple Variable Set,DataArts Factory,User Guide", @@ -6701,7 +6851,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6714,7 +6864,7 @@ "uri":"dataartsstudio_01_0520.html", "node_id":"dataartsstudio_01_0520.xml", "product_code":"dataartsstudio", - "code":"320", + "code":"327", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Usage Guidance", @@ -6722,7 +6872,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6735,7 +6885,7 @@ "uri":"dataartsstudio_01_7524.html", "node_id":"dataartsstudio_01_7524.xml", "product_code":"dataartsstudio", - "code":"321", + "code":"328", "des":"This section describes how to reference parameters in scripts and jobs, application scope of the referenced parameters, and whether EL expressions and simple variable set", "doc_type":"usermanual", "kw":"Referencing Parameters in Scripts and Jobs,Usage Guidance,User Guide", @@ -6743,7 +6893,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6756,7 +6906,7 @@ "uri":"dataartsstudio_01_7523.html", "node_id":"dataartsstudio_01_7523.xml", "product_code":"dataartsstudio", - "code":"322", + "code":"329", "des":"When configuring job scheduling, you can set the scheduling time to the last day of each month using either of the two methods provided in the following table.In DataArts", "doc_type":"usermanual", "kw":"Setting the Job Scheduling Time to the Last Day of Each Month,Usage Guidance,User Guide", @@ -6764,7 +6914,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6777,7 +6927,7 @@ "uri":"dataartsstudio_01_7564.html", "node_id":"dataartsstudio_01_7564.xml", "product_code":"dataartsstudio", - "code":"323", + "code":"330", "des":"This section describes how to configure a job that is scheduled at a specified time of a year.In DataArts Studio, create a job that is scheduled every month and add an em", "doc_type":"usermanual", "kw":"Configuring a Yearly Scheduled Job,Usage Guidance,User Guide", @@ -6785,7 +6935,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6798,7 +6948,7 @@ "uri":"dataartsstudio_01_0585.html", "node_id":"dataartsstudio_01_0585.xml", "product_code":"dataartsstudio", - "code":"324", + "code":"331", "des":"In the migration of a project, if you want to supplement historical business data in a previous period and view details of the historical data, PatchData can meet your re", "doc_type":"usermanual", "kw":"Using PatchData,Usage Guidance,User Guide", @@ -6806,7 +6956,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6819,7 +6969,7 @@ "uri":"dataartsstudio_01_0584.html", "node_id":"dataartsstudio_01_0584.xml", "product_code":"dataartsstudio", - "code":"325", + "code":"332", "des":"This section describes how to obtain the output of an SQL node and apply the output to subsequent nodes or judgment in job development.When you use EL expression #{Job.ge", "doc_type":"usermanual", "kw":"Obtaining the Output of an SQL Node,Usage Guidance,User Guide", @@ -6827,7 +6977,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6840,7 +6990,7 @@ "uri":"dataartsstudio_01_1584.html", "node_id":"dataartsstudio_01_1584.xml", "product_code":"dataartsstudio", - "code":"326", + "code":"333", "des":"You can run a query SQL statement to transfer the obtained maximum time value to a CDM job. In the advanced attributes of the CDM job, the where clause is used to determi", "doc_type":"usermanual", "kw":"Obtaining the Maximum Value and Transferring It to a CDM Job Using a Query SQL Statement,Usage Guida", @@ -6848,7 +6998,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6861,7 +7011,7 @@ "uri":"dataartsstudio_01_0583.html", "node_id":"dataartsstudio_01_0583.xml", "product_code":"dataartsstudio", - "code":"327", + "code":"334", "des":"When developing and orchestrating jobs in DataArts Factory, you can use IF statements to determine the branch to execute.This section describes how to use IF statements i", "doc_type":"usermanual", "kw":"IF Statements,Usage Guidance,User Guide", @@ -6869,7 +7019,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6882,7 +7032,7 @@ "uri":"dataartsstudio_01_0581.html", "node_id":"dataartsstudio_01_0581.xml", "product_code":"dataartsstudio", - "code":"328", + "code":"335", "des":"The Rest Client node can execute RESTful requests.This tutorial describes how to obtain the return value of the Rest Client node, covering the following two application s", "doc_type":"usermanual", "kw":"Obtaining the Return Value of a Rest Client Node,Usage Guidance,User Guide", @@ -6890,7 +7040,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6903,7 +7053,7 @@ "uri":"dataartsstudio_01_0582.html", "node_id":"dataartsstudio_01_0582.xml", "product_code":"dataartsstudio", - "code":"329", + "code":"336", "des":"During job development, if some jobs have different parameters but the same processing logic, you can use For Each nodes to avoid repeated job development.You can use a F", "doc_type":"usermanual", "kw":"Using For Each Nodes,Usage Guidance,User Guide", @@ -6911,7 +7061,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6924,7 +7074,7 @@ "uri":"dataartsstudio_01_1582.html", "node_id":"dataartsstudio_01_1582.xml", "product_code":"dataartsstudio", - "code":"330", + "code":"337", "des":"This function applies to the following scenarios:Use a script template for a Flink SQL script.During pipeline job development, use a Fink SQL script which uses a script t", "doc_type":"usermanual", "kw":"Using Script Templates and Parameter Templates,Usage Guidance,User Guide", @@ -6932,7 +7082,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6945,7 +7095,7 @@ "uri":"dataartsstudio_01_0529.html", "node_id":"dataartsstudio_01_0529.xml", "product_code":"dataartsstudio", - "code":"331", + "code":"338", "des":"This section describes how to develop and execute a Python job using DataArts Factory.An ECS named ecs-dgc has been created.In this example, the ECS uses the CentOS 8.0 6", "doc_type":"usermanual", "kw":"Developing a Python Job,Usage Guidance,User Guide", @@ -6953,7 +7103,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6966,7 +7116,7 @@ "uri":"dataartsstudio_01_0524.html", "node_id":"dataartsstudio_01_0524.xml", "product_code":"dataartsstudio", - "code":"332", + "code":"339", "des":"This section describes how to use the DWS SQL node to develop a job in DataArts Factory.This tutorial describes how to develop a DWS job to collect the sales volume of a ", "doc_type":"usermanual", "kw":"Developing a DWS SQL Job,Usage Guidance,User Guide", @@ -6974,7 +7124,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -6987,7 +7137,7 @@ "uri":"dataartsstudio_01_0522.html", "node_id":"dataartsstudio_01_0522.xml", "product_code":"dataartsstudio", - "code":"333", + "code":"340", "des":"This section introduces how to develop Hive SQL scripts on DataArts Factory.As a one-stop big data development platform, DataArts Factory supports development of multiple", "doc_type":"usermanual", "kw":"Developing a Hive SQL Job,Usage Guidance,User Guide", @@ -6995,7 +7145,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7008,7 +7158,7 @@ "uri":"dataartsstudio_01_0521.html", "node_id":"dataartsstudio_01_0521.xml", "product_code":"dataartsstudio", - "code":"334", + "code":"341", "des":"This section introduces how to develop a DLI Spark job on DataArts Factory.In most cases, SQL is used to analyze and process data when using Data Lake Insight (DLI). Howe", "doc_type":"usermanual", "kw":"Developing a DLI Spark Job,Usage Guidance,User Guide", @@ -7016,7 +7166,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7029,7 +7179,7 @@ "uri":"dataartsstudio_01_0525.html", "node_id":"dataartsstudio_01_0525.xml", "product_code":"dataartsstudio", - "code":"335", + "code":"342", "des":"This section describes how to develop an MRS Spark Python on DataArts Factory.PrerequisitesYou have the permission to access OBS paths.Data preparationPrepare the script ", "doc_type":"usermanual", "kw":"Developing an MRS Spark Python Job,Usage Guidance,User Guide", @@ -7037,7 +7187,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7050,7 +7200,7 @@ "uri":"dataartsstudio_01_1200.html", "node_id":"dataartsstudio_01_1200.xml", "product_code":"dataartsstudio", - "code":"336", + "code":"343", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Audit Log", @@ -7058,7 +7208,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7071,7 +7221,7 @@ "uri":"dataartsstudio_01_0127.html", "node_id":"dataartsstudio_01_0127.xml", "product_code":"dataartsstudio", - "code":"337", + "code":"344", "des":"You can use Cloud Trace Service (CTS) to record key operation events related to DataArts Studio. The events can be used in various scenarios such as security analysis, co", "doc_type":"usermanual", "kw":"Viewing Traces,Audit Log,User Guide", @@ -7079,7 +7229,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7092,7 +7242,7 @@ "uri":"dataartsstudio_01_1207.html", "node_id":"dataartsstudio_01_1207.xml", "product_code":"dataartsstudio", - "code":"338", + "code":"345", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Key Operations Recorded by CTS", @@ -7100,7 +7250,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7113,7 +7263,7 @@ "uri":"dataartsstudio_01_1201.html", "node_id":"dataartsstudio_01_1201.xml", "product_code":"dataartsstudio", - "code":"339", + "code":"346", "des":"CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.", "doc_type":"usermanual", "kw":"Management Center Operations,Key Operations Recorded by CTS,User Guide", @@ -7121,7 +7271,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7134,28 +7284,28 @@ "uri":"dataartsstudio_01_0126.html", "node_id":"dataartsstudio_01_0126.xml", "product_code":"dataartsstudio", - "code":"340", + "code":"347", "des":"CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.", "doc_type":"usermanual", - "kw":"DataArts Migration Operations,Key Operations Recorded by CTS,User Guide", + "kw":"Key CDM Operations Recorded by CTS,Key Operations Recorded by CTS,User Guide", "search_title":"", "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" } ], - "title":"DataArts Migration Operations", + "title":"Key CDM Operations Recorded by CTS", "githuburl":"" }, { "uri":"dataartsstudio_01_1203.html", "node_id":"dataartsstudio_01_1203.xml", "product_code":"dataartsstudio", - "code":"341", + "code":"348", "des":"CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.", "doc_type":"usermanual", "kw":"DataArts Factory Operations,Key Operations Recorded by CTS,User Guide", @@ -7163,7 +7313,7 @@ "metedata":[ { "opensource":"false;true", - "IsBot":"No;yes", + "IsBot":"No;yes;Yes", "IsMulti":"No;no", "documenttype":"usermanual", "prodname":"dataartsstudio" @@ -7176,7 +7326,7 @@ "uri":"dataartsstudio_12_0007.html", "node_id":"dataartsstudio_12_0007.xml", "product_code":"dataartsstudio", - "code":"342", + "code":"349", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"FAQs", @@ -7194,17 +7344,18 @@ "uri":"dataartsstudio_03_0001.html", "node_id":"dataartsstudio_03_0001.xml", "product_code":"dataartsstudio", - "code":"343", + "code":"350", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Consultation and Billing", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Consultation and Billing", @@ -7214,77 +7365,81 @@ "uri":"dataartsstudio_03_0052.html", "node_id":"dataartsstudio_03_0052.xml", "product_code":"dataartsstudio", - "code":"344", + "code":"351", "des":"We use a region to identify the location of a data center. You can create resources in a specific region.A region is a physical data center. Each region is completely ind", "doc_type":"usermanual", - "kw":"Regions,Consultation and Billing,User Guide", + "kw":"How Do I Select a Region?,Consultation and Billing,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Regions", - "githuburl":"" - }, - { - "uri":"dataartsstudio_03_0061.html", - "node_id":"dataartsstudio_03_0061.xml", - "product_code":"dataartsstudio", - "code":"345", - "des":"Check whether a user has been added to the workspace. If no, perform the following steps to add the user.", - "doc_type":"usermanual", - "kw":"What Should I Do If a User Cannot View Workspaces After I Have Assigned the Required Policy to the U", - "search_title":"", - "metedata":[ - { - "IsMulti":"no", - "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" - } - ], - "title":"What Should I Do If a User Cannot View Workspaces After I Have Assigned the Required Policy to the User?", + "title":"How Do I Select a Region?", "githuburl":"" }, { "uri":"dataartsstudio_03_0158.html", "node_id":"dataartsstudio_03_0158.xml", "product_code":"dataartsstudio", - "code":"346", + "code":"352", "des":"In DataArts Studio, system roles and workspace roles are used to assign permissions. By default, if a user is assigned the DARTS User system role but not a workspace role", "doc_type":"usermanual", "kw":"How Do I Isolate Workspaces So That Users Cannot View Unauthorized Workspaces?,Consultation and Bill", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Isolate Workspaces So That Users Cannot View Unauthorized Workspaces?", "githuburl":"" }, + { + "uri":"dataartsstudio_03_0061.html", + "node_id":"dataartsstudio_03_0061.xml", + "product_code":"dataartsstudio", + "code":"353", + "des":"If you assign only the DARTS User system role but not a workspace role to a user, the user cannot access a workspace and an error message is displayed.Check whether the u", + "doc_type":"usermanual", + "kw":"What Should I Do If a User Cannot View Workspaces After I Have Assigned the Required Policy to the U", + "search_title":"", + "metedata":[ + { + "prodname":"dataartsstudio", + "IsMulti":"no;No", + "documenttype":"usermanual", + "IsBot":"yes;No;Yes", + "opensource":"false;true" + } + ], + "title":"What Should I Do If a User Cannot View Workspaces After I Have Assigned the Required Policy to the User?", + "githuburl":"" + }, { "uri":"dataartsstudio_03_0222.html", "node_id":"dataartsstudio_03_0222.xml", "product_code":"dataartsstudio", - "code":"347", - "des":"Yes. The procedure is as follows.To prevent service loss caused by mis-deletion, the system allows only the DARTS Administrator or Tenant Administrator to delete workspac", + "code":"354", + "des":"Yes. The procedure is as follows.Mis-deletion may result in service loss. To delete a workspace, you must use the DARTS Administrator or Tenant Administrator account and ", "doc_type":"usermanual", "kw":"Can I Delete DataArts Studio Workspaces?,Consultation and Billing,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Delete DataArts Studio Workspaces?", @@ -7294,17 +7449,18 @@ "uri":"dataartsstudio_03_0131.html", "node_id":"dataartsstudio_03_0131.xml", "product_code":"dataartsstudio", - "code":"348", + "code":"355", "des":"No. Purchased or trial instances cannot be transferred to another account.", "doc_type":"usermanual", "kw":"Can I Transfer a Purchased or Trial Instance to Another Account?,Consultation and Billing,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Transfer a Purchased or Trial Instance to Another Account?", @@ -7314,17 +7470,18 @@ "uri":"dataartsstudio_03_0087.html", "node_id":"dataartsstudio_03_0087.xml", "product_code":"dataartsstudio", - "code":"349", - "des":"No. You cannot downgrade a purchased DataArts Studio instance.", + "code":"356", + "des":"The version of a created DataArts Studio instance cannot be directly downgraded.However, you can downgrade the version by creating an instance of an earlier version, migr", "doc_type":"usermanual", "kw":"Does DataArts Studio Support Version Downgrade?,Consultation and Billing,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Does DataArts Studio Support Version Downgrade?", @@ -7334,17 +7491,18 @@ "uri":"dataartsstudio_03_0022.html", "node_id":"dataartsstudio_03_0022.xml", "product_code":"dataartsstudio", - "code":"350", + "code":"357", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Management Center", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Management Center", @@ -7354,37 +7512,39 @@ "uri":"dataartsstudio_03_0008.html", "node_id":"dataartsstudio_03_0008.xml", "product_code":"dataartsstudio", - "code":"351", - "des":"For details about the data connections supported by DataArts Studio, see Data Sources Supported by DataArts Studio.", + "code":"358", + "des":"DataArts Studio can interconnect with cloud services such as GaussDB(DWS), DLI, and MRS Hive as well as traditional databases such as MySQL and . For details, see Data So", "doc_type":"usermanual", - "kw":"Which Data Connections Are Supported by DataArts Studio?,Management Center,User Guide", + "kw":"Which Data Sources Can DataArts Studio Connect To?,Management Center,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Which Data Connections Are Supported by DataArts Studio?", + "title":"Which Data Sources Can DataArts Studio Connect To?", "githuburl":"" }, { "uri":"dataartsstudio_03_0009.html", "node_id":"dataartsstudio_03_0009.xml", "product_code":"dataartsstudio", - "code":"352", - "des":"When creating a DWS, MRS Hive, RDS, and SparkSQL data connection, you must bind an agent provided by the CDM cluster. Currently, a version of the CDM cluster earlier than", + "code":"359", + "des":"RDS data connections depend on OBS. If OBS is unavailable in the same region as DataArts Studio, RDS data connections are not supported.For host connections, only Linux h", "doc_type":"usermanual", "kw":"What Are the Precautions for Creating Data Connections?,Management Center,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Are the Precautions for Creating Data Connections?", @@ -7394,37 +7554,39 @@ "uri":"dataartsstudio_03_0016.html", "node_id":"dataartsstudio_03_0016.xml", "product_code":"dataartsstudio", - "code":"353", + "code":"360", "des":"The possible cause is that the CDM cluster is stopped or a concurrency conflict occurs. You can switch to another agent to temporarily avoid this issue.To resolve this is", "doc_type":"usermanual", - "kw":"Why Do DWS/Hive/HBase Data Connections Fail to Obtain the Information About Database or Tables?,Mana", + "kw":"What Should I Do If Database or Table Information Cannot Be Obtained Through a GaussDB(DWS)/Hive/HBa", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why Do DWS/Hive/HBase Data Connections Fail to Obtain the Information About Database or Tables?", + "title":"What Should I Do If Database or Table Information Cannot Be Obtained Through a GaussDB(DWS)/Hive/HBase Data Connection?", "githuburl":"" }, { "uri":"dataartsstudio_03_0017.html", "node_id":"dataartsstudio_03_0017.xml", "product_code":"dataartsstudio", - "code":"354", - "des":"Possible causes are as follows:Hive/HBase components were not selected during MRS cluster creation.The network between the CDM cluster and MRS cluster was disconnected wh", + "code":"361", + "des":"Possible causes are as follows:Hive/HBase components were not selected during MRS cluster creation.The enterprise project selected during MRS cluster creation is differen", "doc_type":"usermanual", "kw":"Why Are MRS Hive/HBase Clusters Not Displayed on the Page for Creating Data Connections?,Management ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Are MRS Hive/HBase Clusters Not Displayed on the Page for Creating Data Connections?", @@ -7434,77 +7596,81 @@ "uri":"dataartsstudio_03_0054.html", "node_id":"dataartsstudio_03_0054.xml", "product_code":"dataartsstudio", - "code":"355", - "des":"The failure may be caused by the rights separation function of the DWS cluster. On the DWS console, click the corresponding cluster, choose Security Settings, and disable", + "code":"362", + "des":"The failure may be caused by the rights separation function of the GaussDB(DWS) cluster.On the DWS console, click the corresponding cluster, choose Security Settings, and", "doc_type":"usermanual", - "kw":"What Should I Do If the Connection Test Fails When I Enable the SSL Connection During the Creation o", + "kw":"What Should I Do If a GaussDB(DWS) Connection Test Fails When SSL Is Enabled for the Connection?,Man", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Should I Do If the Connection Test Fails When I Enable the SSL Connection During the Creation of a DWS Data Connection?", + "title":"What Should I Do If a GaussDB(DWS) Connection Test Fails When SSL Is Enabled for the Connection?", "githuburl":"" }, { "uri":"dataartsstudio_03_0089.html", "node_id":"dataartsstudio_03_0089.xml", "product_code":"dataartsstudio", - "code":"356", - "des":"Multiple data connections of the same type or different types can be created in the same workspace, but their names must be unique.", + "code":"363", + "des":"Yes, but the name of each connection must be unique.To ensure that you can select the correct data connection in future development, you are advised to name the connectio", "doc_type":"usermanual", - "kw":"Can I Create Multiple Data Connections in a Workspace in Proxy Mode?,Management Center,User Guide", + "kw":"Can I Create Multiple Connections to the Same Data Source in a Workspace?,Management Center,User Gui", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Can I Create Multiple Data Connections in a Workspace in Proxy Mode?", + "title":"Can I Create Multiple Connections to the Same Data Source in a Workspace?", "githuburl":"" }, { "uri":"dataartsstudio_03_0137.html", "node_id":"dataartsstudio_03_0137.xml", "product_code":"dataartsstudio", - "code":"357", - "des":"You are advised to choose a proxy connection.", + "code":"364", + "des":"The API connection type is available only for DataArts Factory.To ensure that a connection is available for other components such as DataArts Architecture, DataArts Quali", "doc_type":"usermanual", - "kw":"Should I Choose a Direct or a Proxy Connection When Creating a DWS Connection?,Management Center,Use", + "kw":"Should I Select the API or Proxy Connection Type When Creating a Data Connection in Management Cente", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Should I Choose a Direct or a Proxy Connection When Creating a DWS Connection?", + "title":"Should I Select the API or Proxy Connection Type When Creating a Data Connection in Management Center?", "githuburl":"" }, { "uri":"dataartsstudio_03_0153.html", "node_id":"dataartsstudio_03_0153.xml", "product_code":"dataartsstudio", - "code":"358", - "des":"You can export the jobs in DataArts Factory and then import them to DataArts Factory in another workspace.You can export data connections on the Migrate Resources page of", + "code":"365", + "des":"You can export data connections and jobs from one workspace and import them to another workspace.Export and import data connections in Management Center.Export and import", "doc_type":"usermanual", "kw":"How Do I Migrate the Data Development Jobs and Data Connections from One Workspace to Another?,Manag", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Migrate the Data Development Jobs and Data Connections from One Workspace to Another?", @@ -7514,37 +7680,39 @@ "uri":"dataartsstudio_03_0027.html", "node_id":"dataartsstudio_03_0027.xml", "product_code":"dataartsstudio", - "code":"359", + "code":"366", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", - "kw":"DataArts Migration", + "kw":"DataArts Migration (CDM Jobs)", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"DataArts Migration", + "title":"DataArts Migration (CDM Jobs)", "githuburl":"" }, { "uri":"dataartsstudio_03_0139.html", "node_id":"dataartsstudio_03_0139.xml", "product_code":"dataartsstudio", - "code":"360", + "code":"367", "des":"CDM is developed based on a distributed computing framework and leverages the parallel data processing technology. Table 1 details the advantages of CDM.", "doc_type":"usermanual", - "kw":"What Are the Advantages of CDM?,DataArts Migration,User Guide", + "kw":"What Are the Advantages of CDM?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Are the Advantages of CDM?", @@ -7554,17 +7722,18 @@ "uri":"dataartsstudio_03_0140.html", "node_id":"dataartsstudio_03_0140.xml", "product_code":"dataartsstudio", - "code":"361", + "code":"368", "des":"CDM is a fully hosted service that provides the following capabilities to protect user data security:Instance isolation: CDM users can use only their own instances. Insta", "doc_type":"usermanual", - "kw":"What Are the Security Protection Mechanisms of CDM?,DataArts Migration,User Guide", + "kw":"What Are the Security Protection Mechanisms of CDM?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Are the Security Protection Mechanisms of CDM?", @@ -7574,17 +7743,18 @@ "uri":"dataartsstudio_03_0099.html", "node_id":"dataartsstudio_03_0099.xml", "product_code":"dataartsstudio", - "code":"362", + "code":"369", "des":"When migrating the data on the public network, use NAT Gateway to share the EIPs with other ECSs in the subnet. In this way, data on the on-premises data center or third-", "doc_type":"usermanual", - "kw":"How Do I Reduce the Cost of Using CDM?,DataArts Migration,User Guide", + "kw":"How Do I Reduce the Cost of Using CDM?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Reduce the Cost of Using CDM?", @@ -7594,17 +7764,18 @@ "uri":"dataartsstudio_03_0302.html", "node_id":"dataartsstudio_03_0302.xml", "product_code":"dataartsstudio", - "code":"363", + "code":"370", "des":"No. To use a later version cluster, you can create one.", "doc_type":"usermanual", - "kw":"Can I Upgrade a CDM Cluster?,DataArts Migration,User Guide", + "kw":"Can I Upgrade a CDM Cluster?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Upgrade a CDM Cluster?", @@ -7614,17 +7785,18 @@ "uri":"dataartsstudio_03_0141.html", "node_id":"dataartsstudio_03_0141.xml", "product_code":"dataartsstudio", - "code":"364", + "code":"371", "des":"Theoretically, a cdm.large CDM instance can migrate 1 TB to 8 TB data per day. The actual transmission rate is affected by factors such as the Internet bandwidth, cluster", "doc_type":"usermanual", - "kw":"How Is the Migration Performance of CDM?,DataArts Migration,User Guide", + "kw":"How Is the Migration Performance of CDM?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Is the Migration Performance of CDM?", @@ -7634,17 +7806,18 @@ "uri":"dataartsstudio_03_0124.html", "node_id":"dataartsstudio_03_0124.xml", "product_code":"dataartsstudio", - "code":"365", + "code":"372", "des":"CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submitted, CDM splits each job into multiple tasks based on the ", "doc_type":"usermanual", - "kw":"What Is the Number of Concurrent Jobs for Different CDM Cluster Versions?,DataArts Migration,User Gu", + "kw":"What Is the Number of Concurrent Jobs for Different CDM Cluster Versions?,DataArts Migration (CDM Jo", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Is the Number of Concurrent Jobs for Different CDM Cluster Versions?", @@ -7654,17 +7827,18 @@ "uri":"dataartsstudio_03_0069.html", "node_id":"dataartsstudio_03_0069.xml", "product_code":"dataartsstudio", - "code":"366", - "des":"CDM supports incremental data migration. With scheduled jobs and macro variables of date and time, CDM provides incremental data migration in the following scenarios:Incr", + "code":"373", + "des":"Does CDM support incremental data migration?CDM supports incremental data migration.With scheduled jobs and macro variables of date and time, CDM provides incremental dat", "doc_type":"usermanual", - "kw":"Does CDM Support Incremental Data Migration?,DataArts Migration,User Guide", + "kw":"Does CDM Support Incremental Data Migration?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Does CDM Support Incremental Data Migration?", @@ -7674,17 +7848,18 @@ "uri":"dataartsstudio_03_0028.html", "node_id":"dataartsstudio_03_0028.xml", "product_code":"dataartsstudio", - "code":"367", + "code":"374", "des":"Yes. CDM supports the following field converters:AnonymizationTrimReverse StringReplace StringExpression ConversionYou can create a field converter on the Map Field page ", "doc_type":"usermanual", - "kw":"Does CDM Support Field Conversion?,DataArts Migration,User Guide", + "kw":"Does CDM Support Field Conversion?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Does CDM Support Field Conversion?", @@ -7694,17 +7869,18 @@ "uri":"dataartsstudio_03_0107.html", "node_id":"dataartsstudio_03_0107.xml", "product_code":"dataartsstudio", - "code":"368", + "code":"375", "des":"The recommended component versions can be used as both the source and destination.", "doc_type":"usermanual", - "kw":"What Component Versions Are Recommended for Migrating Hadoop Data Sources?,DataArts Migration,User G", + "kw":"What Component Versions Are Recommended for Migrating Hadoop Data Sources?,DataArts Migration (CDM J", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Component Versions Are Recommended for Migrating Hadoop Data Sources?", @@ -7714,17 +7890,18 @@ "uri":"dataartsstudio_03_0029.html", "node_id":"dataartsstudio_03_0029.xml", "product_code":"dataartsstudio", - "code":"369", - "des":"CDM can read and write data in SequenceFile, TextFile, ORC, or Parquet format from the Hive data source.", + "code":"376", + "des":"Which data formats are supported when the data source is Hive?CDM can read and write data in SequenceFile, TextFile, ORC, or Parquet format from the Hive data source.", "doc_type":"usermanual", - "kw":"What Data Formats Are Supported When the Data Source Is Hive?,DataArts Migration,User Guide", + "kw":"What Data Formats Are Supported When the Data Source Is Hive?,DataArts Migration (CDM Jobs),User Gui", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Data Formats Are Supported When the Data Source Is Hive?", @@ -7734,17 +7911,18 @@ "uri":"dataartsstudio_03_0030.html", "node_id":"dataartsstudio_03_0030.xml", "product_code":"dataartsstudio", - "code":"370", - "des":"CDM does not support direct job migration across clusters. However, you can use the batch job import and export function to indirectly implement cross-cluster migration a", + "code":"377", + "des":"Can I synchronize jobs to other CDM clusters?CDM does not support direct job migration across clusters. However, you can use the batch job import and export function to i", "doc_type":"usermanual", - "kw":"Can I Synchronize Jobs to Other Clusters?,DataArts Migration,User Guide", + "kw":"Can I Synchronize Jobs to Other Clusters?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Synchronize Jobs to Other Clusters?", @@ -7754,17 +7932,18 @@ "uri":"dataartsstudio_03_0031.html", "node_id":"dataartsstudio_03_0031.xml", "product_code":"dataartsstudio", - "code":"371", - "des":"CDM supports batch job creation with the help of the batch import function. You can create jobs in batches as follows:Create a job manually.Export the job and save the jo", + "code":"378", + "des":"Can I create CDM jobs in batches?CDM supports batch job creation with the help of the batch import function. You can create jobs in batches as follows:Create a job manual", "doc_type":"usermanual", - "kw":"Can I Create Jobs in Batches?,DataArts Migration,User Guide", + "kw":"Can I Create Jobs in Batches?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Create Jobs in Batches?", @@ -7774,17 +7953,18 @@ "uri":"dataartsstudio_03_0100.html", "node_id":"dataartsstudio_03_0100.xml", "product_code":"dataartsstudio", - "code":"372", - "des":"Yes.Access the DataArts Factory module of the DataArts Studio service.In the navigation pane of the DataArts Factory homepage, choose Data Development > Develop Job to cr", + "code":"379", + "des":"Can I schedule CDM jobs in batches?Yes.Access the DataArts Factory module of the DataArts Studio service.In the navigation pane of the DataArts Factory homepage, choose D", "doc_type":"usermanual", - "kw":"Can I Schedule Jobs in Batches?,DataArts Migration,User Guide", + "kw":"Can I Schedule Jobs in Batches?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Schedule Jobs in Batches?", @@ -7794,17 +7974,18 @@ "uri":"dataartsstudio_03_0032.html", "node_id":"dataartsstudio_03_0032.xml", "product_code":"dataartsstudio", - "code":"373", - "des":"You can use the batch export function of CDM to save all job scripts to a local PC. Then, you can create a cluster and import the jobs again when necessary.", + "code":"380", + "des":"How do I back up CDM jobs?You can use the batch export function of CDM to save all job scripts to a local PC. Then, you can create a cluster and import the jobs again whe", "doc_type":"usermanual", - "kw":"How Do I Back Up CDM Jobs?,DataArts Migration,User Guide", + "kw":"How Do I Back Up CDM Jobs?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Back Up CDM Jobs?", @@ -7814,37 +7995,39 @@ "uri":"dataartsstudio_03_0119.html", "node_id":"dataartsstudio_03_0119.xml", "product_code":"dataartsstudio", - "code":"374", - "des":"To ensure that CDM can communicate with the HANA cluster, perform the following operations:Disable Statement Routing of the HANA cluster. Note that this will increase the", + "code":"381", + "des":"What should I do If only some nodes in a HANA cluster can communicate with the CDM cluster?To ensure that CDM can communicate with the HANA cluster, perform the following", "doc_type":"usermanual", - "kw":"How Do I Configure the Connection If Only Some Nodes in the HANA Cluster Can Communicate with the CD", + "kw":"What Should I Do If Only Some Nodes in a HANA Cluster Can Communicate with the CDM Cluster?,DataArts", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"How Do I Configure the Connection If Only Some Nodes in the HANA Cluster Can Communicate with the CDM Cluster?", + "title":"What Should I Do If Only Some Nodes in a HANA Cluster Can Communicate with the CDM Cluster?", "githuburl":"" }, { "uri":"dataartsstudio_03_0101.html", "node_id":"dataartsstudio_03_0101.xml", "product_code":"dataartsstudio", - "code":"375", + "code":"382", "des":"CDM provides RESTful APIs to implement automatic job creation or execution control by program invocation.The following describes how to use CDM to migrate data from table", "doc_type":"usermanual", - "kw":"How Do I Use Java to Invoke CDM RESTful APIs to Create Data Migration Jobs?,DataArts Migration,User ", + "kw":"How Do I Use Java to Invoke CDM RESTful APIs to Create Data Migration Jobs?,DataArts Migration (CDM ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Use Java to Invoke CDM RESTful APIs to Create Data Migration Jobs?", @@ -7854,17 +8037,18 @@ "uri":"dataartsstudio_03_0033.html", "node_id":"dataartsstudio_03_0033.xml", "product_code":"dataartsstudio", - "code":"376", + "code":"383", "des":"Many enterprises deploy key data sources on the intranet, such as databases and file servers. CDM runs on the cloud. To migrate the intranet data to the cloud using CDM, ", "doc_type":"usermanual", - "kw":"How Do I Connect the On-Premises Intranet or Third-Party Private Network to CDM?,DataArts Migration,", + "kw":"How Do I Connect the On-Premises Intranet or Third-Party Private Network to CDM?,DataArts Migration ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Connect the On-Premises Intranet or Third-Party Private Network to CDM?", @@ -7874,17 +8058,18 @@ "uri":"dataartsstudio_03_0336.html", "node_id":"dataartsstudio_03_0336.xml", "product_code":"dataartsstudio", - "code":"377", + "code":"384", "des":"CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submitted, CDM splits each job into multiple tasks based on the ", "doc_type":"usermanual", - "kw":"How Do I Set the Number of Concurrent Extractors for a CDM Migration Job?,DataArts Migration,User Gu", + "kw":"How Do I Set the Number of Concurrent Extractors for a CDM Migration Job?,DataArts Migration (CDM Jo", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Set the Number of Concurrent Extractors for a CDM Migration Job?", @@ -7894,17 +8079,18 @@ "uri":"dataartsstudio_03_0337.html", "node_id":"dataartsstudio_03_0337.xml", "product_code":"dataartsstudio", - "code":"378", - "des":"No. If data is written to the source during the migration, an error may occur.", + "code":"385", + "des":"Does CDM support real-time migration of dynamic data?No.If data is written to the source during the migration, an error may occur.", "doc_type":"usermanual", - "kw":"Does CDM Support Real-Time Migration of Dynamic Data?,DataArts Migration,User Guide", + "kw":"Does CDM Support Real-Time Migration of Dynamic Data?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Does CDM Support Real-Time Migration of Dynamic Data?", @@ -7914,17 +8100,18 @@ "uri":"dataartsstudio_03_0340.html", "node_id":"dataartsstudio_03_0340.xml", "product_code":"dataartsstudio", - "code":"379", - "des":"You can use the DateUtils.format(${timestamp()},\"yyyy-MM-dd HH:mm:ss\") expression on the Map Field page to obtain the current time.", + "code":"386", + "des":"How do I obtain the current time using an expression?You can use the DateUtils.format(${timestamp()},\"yyyy-MM-dd HH:mm:ss\") expression on the Map Field page to obtain the", "doc_type":"usermanual", - "kw":"How Do I Obtain the Current Time Using an Expression?,DataArts Migration,User Guide", + "kw":"How Do I Obtain the Current Time Using an Expression?,DataArts Migration (CDM Jobs),User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Obtain the Current Time Using an Expression?", @@ -7934,17 +8121,18 @@ "uri":"dataartsstudio_03_0106.html", "node_id":"dataartsstudio_03_0106.xml", "product_code":"dataartsstudio", - "code":"380", + "code":"387", "des":"When CDM is used to import data from OBS to SQL Server, the job fails to be executed and error message \"Unable to execute the SQL statement. Cause: \"String or binary data", "doc_type":"usermanual", "kw":"What Can I Do If Error Message \"Unable to execute the SQL statement\" Is Displayed When I Import Data", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Can I Do If Error Message \"Unable to execute the SQL statement\" Is Displayed When I Import Data from OBS to SQL Server?", @@ -7954,17 +8142,18 @@ "uri":"dataartsstudio_03_0071.html", "node_id":"dataartsstudio_03_0071.xml", "product_code":"dataartsstudio", - "code":"381", + "code":"388", "des":"When CDM is used to migrate Oracle data to DWS, an error is reported, as shown in Figure 1.During data migration, if the entire table is queried and the table contains a ", "doc_type":"usermanual", - "kw":"Why Is Error ORA-01555 Reported During Migration from Oracle to DWS?,DataArts Migration,User Guide", + "kw":"Why Is Error ORA-01555 Reported During Migration from Oracle to DWS?,DataArts Migration (CDM Jobs),U", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is Error ORA-01555 Reported During Migration from Oracle to DWS?", @@ -7974,37 +8163,39 @@ "uri":"dataartsstudio_03_0072.html", "node_id":"dataartsstudio_03_0072.xml", "product_code":"dataartsstudio", - "code":"382", - "des":"By default, the userAdmin role has only the permissions to manage roles and users and does not have the read and write permissions on a database.If the MongoDB connection", + "code":"389", + "des":"Migration using a MongoDB connection fails.By default, the userAdmin role has only the permissions to manage roles and users and does not have the read and write permissi", "doc_type":"usermanual", - "kw":"What Should I Do If the MongoDB Connection Migration Fails?,DataArts Migration,User Guide", + "kw":"What Should I Do If Migration Using a MongoDB Connection Fails?,DataArts Migration (CDM Jobs),User G", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Should I Do If the MongoDB Connection Migration Fails?", + "title":"What Should I Do If Migration Using a MongoDB Connection Fails?", "githuburl":"" }, { "uri":"dataartsstudio_03_0093.html", "node_id":"dataartsstudio_03_0093.xml", "product_code":"dataartsstudio", - "code":"383", - "des":"Manually stop the Hive migration job and add the following attribute settings to the Hive data connection:Attribute Name: hive.server2.idle.operation.timeoutValue: 10mIn ", + "code":"390", + "des":"What should I do If a Hive migration job is suspended for a long period of time?Manually stop the Hive migration job and add the following attribute settings to the Hive ", "doc_type":"usermanual", - "kw":"What Should I Do If a Hive Migration Job Is Suspended for a Long Period of Time?,DataArts Migration,", + "kw":"What Should I Do If a Hive Migration Job Is Suspended for a Long Period of Time?,DataArts Migration ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a Hive Migration Job Is Suspended for a Long Period of Time?", @@ -8014,17 +8205,18 @@ "uri":"dataartsstudio_03_0109.html", "node_id":"dataartsstudio_03_0109.xml", "product_code":"dataartsstudio", - "code":"384", + "code":"391", "des":"When you use CDM to migrate data to DWS, the migration job fails and the error message \"value too long for type character varying\" is displayed in the execution log.The p", "doc_type":"usermanual", "kw":"What Should I Do If an Error Is Reported Because the Field Type Mapping Does Not Match During Data M", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If an Error Is Reported Because the Field Type Mapping Does Not Match During Data Migration Using CDM?", @@ -8034,17 +8226,18 @@ "uri":"dataartsstudio_03_0110.html", "node_id":"dataartsstudio_03_0110.xml", "product_code":"dataartsstudio", - "code":"385", - "des":"The following error message is displayed during MySQL migration: \"Unable to connect to the database server. Cause: connect timed out.\"The table has a large data volume, a", + "code":"392", + "des":"The following error message is displayed during MySQL migration: \"Unable to connect to the database server. Cause: connect timed out\"The table has a large data volume, an", "doc_type":"usermanual", "kw":"What Should I Do If a JDBC Connection Timeout Error Is Reported During MySQL Migration?,DataArts Mig", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a JDBC Connection Timeout Error Is Reported During MySQL Migration?", @@ -8054,37 +8247,39 @@ "uri":"dataartsstudio_03_0121.html", "node_id":"dataartsstudio_03_0121.xml", "product_code":"dataartsstudio", - "code":"386", - "des":"You are advised to clear historical data and try again. In addition, when creating a migration job, you are advised to enable the system to clear historical data. This gr", + "code":"393", + "des":"A CDM migration job fails after a link from Hive to GaussDB(DWS) is created.You are advised to clear historical data and try again. In addition, when creating a migration", "doc_type":"usermanual", - "kw":"What Should I Do If a CDM Migration Job Fails After a Link from Hive to DWS Is Created?,DataArts Mig", + "kw":"What Should I Do If a CDM Migration Job Fails After a Link from Hive to GaussDB(DWS) Is Created?,Dat", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Should I Do If a CDM Migration Job Fails After a Link from Hive to DWS Is Created?", + "title":"What Should I Do If a CDM Migration Job Fails After a Link from Hive to GaussDB(DWS) Is Created?", "githuburl":"" }, { "uri":"dataartsstudio_03_0122.html", "node_id":"dataartsstudio_03_0122.xml", "product_code":"dataartsstudio", - "code":"387", - "des":"CDM does not support this operation. You are advised to manually export a MySQL data file, enable the SFTP service on the server, and create a CDM job with SFTP as the so", + "code":"394", + "des":"How do I use CDM to export MySQL data to an SQL file and upload the file to an OBS bucket?CDM does not support this operation. You are advised to manually export a MySQL ", "doc_type":"usermanual", "kw":"How Do I Use CDM to Export MySQL Data to an SQL File and Upload the File to an OBS Bucket?,DataArts ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Use CDM to Export MySQL Data to an SQL File and Upload the File to an OBS Bucket?", @@ -8094,17 +8289,18 @@ "uri":"dataartsstudio_03_0123.html", "node_id":"dataartsstudio_03_0123.xml", "product_code":"dataartsstudio", - "code":"388", - "des":"Dirty data writing is configured, but no dirty data exists. You need to decrease the number of concurrent tasks to avoid this issue.", + "code":"395", + "des":"CDM fails to migrate data from OBS to DLI.Dirty data writing is configured, but no dirty data exists. You need to decrease the number of concurrent tasks to avoid this is", "doc_type":"usermanual", - "kw":"What Should I Do If CDM Fails to Migrate Data from OBS to DLI?,DataArts Migration,User Guide", + "kw":"What Should I Do If CDM Fails to Migrate Data from OBS to DLI?,DataArts Migration (CDM Jobs),User Gu", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If CDM Fails to Migrate Data from OBS to DLI?", @@ -8114,17 +8310,18 @@ "uri":"dataartsstudio_03_0132.html", "node_id":"dataartsstudio_03_0132.xml", "product_code":"dataartsstudio", - "code":"389", + "code":"396", "des":"This error is reported because the customer's certificate has expired. Update the certificate and reconfigure the connector.", "doc_type":"usermanual", "kw":"What Should I Do If a CDM Connector Reports the Error \"Configuration Item [linkConfig.iamAuth] Does ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a CDM Connector Reports the Error \"Configuration Item [linkConfig.iamAuth] Does Not Exist\"?", @@ -8134,17 +8331,18 @@ "uri":"dataartsstudio_03_0333.html", "node_id":"dataartsstudio_03_0333.xml", "product_code":"dataartsstudio", - "code":"390", - "des":"If you create a link or save a job in a CDM cluster of an earlier version, and then access a CDM cluster of a later version, this error occurs occasionally.Manually clear", + "code":"397", + "des":"Error message \"Configuration Item [linkConfig.createBackendLinks] Does Not Exist\" or \"Configuration Item [throttlingConfig.concurrentSubJobs] Does Not Exist\" is displayed", "doc_type":"usermanual", "kw":"What Should I Do If Error \"Configuration Item [linkConfig.createBackendLinks] Does Not Exist\" or \"Co", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error \"Configuration Item [linkConfig.createBackendLinks] Does Not Exist\" or \"Configuration Item [throttlingConfig.concurrentSubJobs] Does Not Exist\" Is Reported?", @@ -8154,17 +8352,18 @@ "uri":"dataartsstudio_03_0166.html", "node_id":"dataartsstudio_03_0166.xml", "product_code":"dataartsstudio", - "code":"391", - "des":"This failure occurs because you do not have the required permissions. Create another service user, grant the required permissions to it, and try again.To create a data co", + "code":"398", + "des":"Message \"CORE_0031:Connect time out. (Cdm.0523)\" is displayed during the creation of an MRS Hive link.If a message is displayed indicating that the configuration file can", "doc_type":"usermanual", "kw":"What Should I Do If Message \"CORE_0031:Connect time out. (Cdm.0523)\" Is Displayed During the Creatio", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Message \"CORE_0031:Connect time out. (Cdm.0523)\" Is Displayed During the Creation of an MRS Hive Link?", @@ -8174,17 +8373,18 @@ "uri":"dataartsstudio_03_0167.html", "node_id":"dataartsstudio_03_0167.xml", "product_code":"dataartsstudio", - "code":"392", - "des":"The cause is that the database table name contains special characters, resulting in incorrect syntax. You can resolve this issue by renaming the database table according ", + "code":"399", + "des":"Message \"CDM Does Not Support Auto Creation of an Empty Table with No Column\" is displayed when I enable auto table creation.The cause is that the database table name con", "doc_type":"usermanual", "kw":"What Should I Do If Message \"CDM Does Not Support Auto Creation of an Empty Table with No Column\" Is", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Message \"CDM Does Not Support Auto Creation of an Empty Table with No Column\" Is Displayed When I Enable Auto Table Creation?", @@ -8194,17 +8394,18 @@ "uri":"dataartsstudio_03_0334.html", "node_id":"dataartsstudio_03_0334.xml", "product_code":"dataartsstudio", - "code":"393", - "des":"This may be because you have uploaded the latest ORACLE_8 driver (for example, Oracle Database 21c (21.3) driver), which is not supported yet. You are advised to use the ", + "code":"400", + "des":"I cannot obtain the schema name when creating an Oracle relational database migration job.The latest ORACLE_8 driver, which is not supported, may have been uploaded, for ", "doc_type":"usermanual", "kw":"What Should I Do If I Cannot Obtain the Schema Name When Creating an Oracle Relational Database Migr", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If I Cannot Obtain the Schema Name When Creating an Oracle Relational Database Migration Job?", @@ -8214,17 +8415,18 @@ "uri":"dataartsstudio_03_0341.html", "node_id":"dataartsstudio_03_0341.xml", "product_code":"dataartsstudio", - "code":"394", + "code":"401", "des":"The MySQL database stores values 0 and 1, rather than true and false. However, true or false is read during MySQL database migration, and the following error information ", "doc_type":"usermanual", "kw":"What Should I Do If invalid input syntax for integer: \"true\" Is Displayed During MySQL Database Migr", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If invalid input syntax for integer: \"true\" Is Displayed During MySQL Database Migration?", @@ -8234,17 +8436,18 @@ "uri":"dataartsstudio_03_0035.html", "node_id":"dataartsstudio_03_0035.xml", "product_code":"dataartsstudio", - "code":"395", + "code":"402", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"DataArts Factory", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"DataArts Factory", @@ -8254,17 +8457,18 @@ "uri":"dataartsstudio_03_0036.html", "node_id":"dataartsstudio_03_0036.xml", "product_code":"dataartsstudio", - "code":"396", - "des":"By default, each user can create a maximum of 10,000 jobs, and each job can contain a maximum of 200 nodes.", + "code":"403", + "des":"Whether the number of jobs and the number of nodes in a job are limited during data developmentBy default, each user can create a maximum of 10,000 jobs, and each job can", "doc_type":"usermanual", "kw":"How Many Jobs Can Be Created in DataArts Factory? Is There a Limit on the Number of Nodes in a Job?,", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Many Jobs Can Be Created in DataArts Factory? Is There a Limit on the Number of Nodes in a Job?", @@ -8274,17 +8478,18 @@ "uri":"dataartsstudio_03_0126.html", "node_id":"dataartsstudio_03_0126.xml", "product_code":"dataartsstudio", - "code":"397", - "des":"Yes.", + "code":"404", + "des":"Whether DataArts Studio supports custom Python scriptsYes.", "doc_type":"usermanual", "kw":"Does DataArts Studio Support Custom Python Scripts?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Does DataArts Studio Support Custom Python Scripts?", @@ -8294,17 +8499,18 @@ "uri":"dataartsstudio_03_0041.html", "node_id":"dataartsstudio_03_0041.xml", "product_code":"dataartsstudio", - "code":"398", - "des":"On the Running History page, there is a large difference between Job Execution Time and Start Time, as shown in the figure below. Job Execution Time is the time when the ", + "code":"405", + "des":"On the Running History page, there is a large difference between Job Execution Time and Start Time. Job Execution Time is the time when the job is expected to be executed", "doc_type":"usermanual", "kw":"Why Is There a Large Difference Between Job Execution Time and Start Time of a Job?,DataArts Factory", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is There a Large Difference Between Job Execution Time and Start Time of a Job?", @@ -8314,17 +8520,18 @@ "uri":"dataartsstudio_03_0042.html", "node_id":"dataartsstudio_03_0042.xml", "product_code":"dataartsstudio", - "code":"399", - "des":"The subsequent jobs may be suspended, continued, or canceled, depending on the configuration.In this case, do not stop the job. You can rerun the failed job instance or s", + "code":"406", + "des":"One of the jobs that depend on each other fails during scheduling.The subsequent jobs may be suspended, continued, or canceled, depending on the configuration.In this cas", "doc_type":"usermanual", "kw":"Will Subsequent Jobs Be Affected If a Job Fails to Be Executed During Scheduling of Dependent Jobs? ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Will Subsequent Jobs Be Affected If a Job Fails to Be Executed During Scheduling of Dependent Jobs? What Should I Do?", @@ -8334,17 +8541,18 @@ "uri":"dataartsstudio_03_0149.html", "node_id":"dataartsstudio_03_0149.xml", "product_code":"dataartsstudio", - "code":"400", - "des":"Lock management is unavailable for DLI and MRS. Therefore, if you perform read and write operations on the tables simultaneously, data conflict will occur and the operati", + "code":"407", + "des":"Notes for scheduling big data services using DataArts StudioLock management is unavailable for DLI and MRS. Therefore, if you perform read and write operations on the tab", "doc_type":"usermanual", "kw":"What Should I Pay Attention to When Using DataArts Studio to Schedule Big Data Services?,DataArts Fa", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Pay Attention to When Using DataArts Studio to Schedule Big Data Services?", @@ -8354,57 +8562,60 @@ "uri":"dataartsstudio_03_0136.html", "node_id":"dataartsstudio_03_0136.xml", "product_code":"dataartsstudio", - "code":"401", - "des":"Parameters can be set in environment variables, job parameters, and script parameters, but their application scopes are different. If there is a conflict when parameters ", + "code":"408", + "des":"Differences and relationships between environment variables, job parameters, and script parametersThe application scopes of workspace environment variables, job parameter", "doc_type":"usermanual", - "kw":"What Are the Differences and Connections Among Environment Variables, Job Parameters, and Script Par", + "kw":"What Are the Differences and Relationships Between Environment Variables, Job Parameters, and Script", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Are the Differences and Connections Among Environment Variables, Job Parameters, and Script Parameters?", + "title":"What Are the Differences and Relationships Between Environment Variables, Job Parameters, and Script Parameters?", "githuburl":"" }, { "uri":"dataartsstudio_03_0050.html", "node_id":"dataartsstudio_03_0050.xml", "product_code":"dataartsstudio", - "code":"402", - "des":"Job logs are stored in OBS buckets. You must configure the bucket directory for storing job logs in the workspace and check whether the your account has the OBS read perm", + "code":"409", + "des":"You do not have the required permissions.Job logs are stored in OBS buckets. You must configure the bucket directory for storing job logs in the workspace and check wheth", "doc_type":"usermanual", - "kw":"What Should I Do If Job Logs Cannot Be Opened and Error 404 Is Reported?,DataArts Factory,User Guide", + "kw":"What Should I Do If a Job Log Cannot Be Opened and Error 404 Is Reported?,DataArts Factory,User Guid", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Should I Do If Job Logs Cannot Be Opened and Error 404 Is Reported?", + "title":"What Should I Do If a Job Log Cannot Be Opened and Error 404 Is Reported?", "githuburl":"" }, { "uri":"dataartsstudio_03_0051.html", "node_id":"dataartsstudio_03_0051.xml", "product_code":"dataartsstudio", - "code":"403", - "des":"When a workspace- or job-level agency is configured, the following error is reported when the agency list is viewed:Policy doesn't allow iam:agencies:listAgencies to be p", + "code":"410", + "des":"If error message \"Policy doesn't allow iam:agencies:listAgencies to be performed.\" is displayed when you are creating a workspace-level or job-level agency, you may lack ", "doc_type":"usermanual", "kw":"What Should I Do If the Agency List Fails to Be Obtained During Agency Configuration?,DataArts Facto", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If the Agency List Fails to Be Obtained During Agency Configuration?", @@ -8414,37 +8625,39 @@ "uri":"dataartsstudio_03_0056.html", "node_id":"dataartsstudio_03_0056.xml", "product_code":"dataartsstudio", - "code":"404", - "des":"Ensure that the current instance and peripheral resources are in the same region and IAM project. If the enterprise project function is enabled for your account, the curr", + "code":"411", + "des":"The specified peripheral resources may not be in the same region as the instance.Ensure that the current DataArts Studio instance and peripheral resources are in the same", "doc_type":"usermanual", - "kw":"Why Cannot Specified Peripheral Resources Be Selected When a Data Connection Is Created in Data Deve", + "kw":"Why Can't I Select Specified Peripheral Resources When Creating a Data Connection in DataArts Factor", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why Cannot Specified Peripheral Resources Be Selected When a Data Connection Is Created in Data Development?", + "title":"Why Can't I Select Specified Peripheral Resources When Creating a Data Connection in DataArts Factory?", "githuburl":"" }, { "uri":"dataartsstudio_03_0058.html", "node_id":"dataartsstudio_03_0058.xml", "product_code":"dataartsstudio", - "code":"405", - "des":"On the Data Development page, choose MonitoringMonitor Job to check whether the target job is being scheduled. A job can be scheduled only within the scheduling period.Vi", + "code":"412", + "des":"Why Is There No Job Running Scheduling Log on the Monitor Instance Page After Periodic Scheduling Is Configured for a Job? This job has not been started or the job on whi", "doc_type":"usermanual", "kw":"Why Is There No Job Running Scheduling Log on the Monitor Instance Page After Periodic Scheduling Is", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is There No Job Running Scheduling Log on the Monitor Instance Page After Periodic Scheduling Is Configured for a Job?", @@ -8454,57 +8667,60 @@ "uri":"dataartsstudio_03_0059.html", "node_id":"dataartsstudio_03_0059.xml", "product_code":"dataartsstudio", - "code":"406", - "des":"Check whether the data connection used by the Hive SQL and Spark SQL scripts is direct connection or proxy connection.In direct connection mode, DataArts Studio users sub", + "code":"413", + "des":"This issue may be caused by the connection mode.Check whether the data connection used by the Hive SQL and Spark SQL scripts is an MRS API connection or proxy connection.", "doc_type":"usermanual", - "kw":"Why does the GUI display only the failure result but not the specific error cause after Hive SQL and", + "kw":"Why Isn't the Error Cause Displayed on the Console When a Hive SQL or Spark SQL Scripts Fails?,DataA", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why does the GUI display only the failure result but not the specific error cause after Hive SQL and Spark SQL scripts fail to be executed?", + "title":"Why Isn't the Error Cause Displayed on the Console When a Hive SQL or Spark SQL Scripts Fails?", "githuburl":"" }, { "uri":"dataartsstudio_03_0060.html", "node_id":"dataartsstudio_03_0060.xml", "product_code":"dataartsstudio", - "code":"407", - "des":"Check whether the permissions of the current user in IAM are changed, whether the user is removed from the user group, or whether the permission policy of the user group ", + "code":"414", + "des":"During the execution of a data development node, a message is displayed indicating that the token is invalid.Check whether the permissions of the current user in IAM are ", "doc_type":"usermanual", - "kw":"What Do I Do If the Token Is Invalid During the Running of a Data Development Node?,DataArts Factory", + "kw":"What Should I Do If the Token Is Invalid During the Execution of a Data Development Node?,DataArts F", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Do I Do If the Token Is Invalid During the Running of a Data Development Node?", + "title":"What Should I Do If the Token Is Invalid During the Execution of a Data Development Node?", "githuburl":"" }, { "uri":"dataartsstudio_03_0062.html", "node_id":"dataartsstudio_03_0062.xml", "product_code":"dataartsstudio", - "code":"408", - "des":"Method 1: After the node test is complete, right-click the current node and choose View Log from the shortcut menu.Method 2: Click Monitorin the upper part of the canvas,", + "code":"415", + "des":"How to view run logs after testing a jobMethod 1: After the node test is complete, right-click the current node and choose View Log from the shortcut menu.Method 2: Click", "doc_type":"usermanual", "kw":"How Do I View Run Logs After a Job Is Tested?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I View Run Logs After a Job Is Tested?", @@ -8514,17 +8730,18 @@ "uri":"dataartsstudio_03_0063.html", "node_id":"dataartsstudio_03_0063.xml", "product_code":"dataartsstudio", - "code":"409", - "des":"Jobs scheduled by month depend on jobs scheduled by day. Why does a job scheduled by month start running before the job scheduled by day is complete?Although jobs schedul", + "code":"416", + "des":"The monthly job depends on daily jobs of the previous month rather than the current month.Jobs scheduled by month depend on jobs scheduled by day. Why does a job schedule", "doc_type":"usermanual", "kw":"Why Does a Job Scheduled by Month Start Running Before the Job Scheduled by Day Is Complete?,DataArt", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Does a Job Scheduled by Month Start Running Before the Job Scheduled by Day Is Complete?", @@ -8534,17 +8751,18 @@ "uri":"dataartsstudio_03_0065.html", "node_id":"dataartsstudio_03_0065.xml", "product_code":"dataartsstudio", - "code":"410", - "des":"Check whether the current user has the DLI Service User or DLI Service Admin permissions in IAM.", + "code":"417", + "des":"This issue may be caused by insufficient permissions.Check whether the current user has the DLI Service User or DLI Service Admin permissions in IAM.", "doc_type":"usermanual", "kw":"What Should I Do If Invalid Authentication Is Reported When I Run a DLI Script?,DataArts Factory,Use", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Invalid Authentication Is Reported When I Run a DLI Script?", @@ -8554,37 +8772,39 @@ "uri":"dataartsstudio_03_0066.html", "node_id":"dataartsstudio_03_0066.xml", "product_code":"dataartsstudio", - "code":"411", - "des":"Check whether the CDM cluster is stopped. If it is stopped, restart it.", + "code":"418", + "des":"The CDM cluster may be stopped.Check whether the CDM cluster is stopped. If it is stopped, restart it.", "doc_type":"usermanual", - "kw":"Why Cannot I Select the Desired CDM Cluster in Proxy Mode When Creating a Data Connection?,DataArts ", + "kw":"Why Cannot I Select a Desired CDM Cluster in Proxy Mode When Creating a Data Connection?,DataArts Fa", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why Cannot I Select the Desired CDM Cluster in Proxy Mode When Creating a Data Connection?", + "title":"Why Cannot I Select a Desired CDM Cluster in Proxy Mode When Creating a Data Connection?", "githuburl":"" }, { "uri":"dataartsstudio_03_0111.html", "node_id":"dataartsstudio_03_0111.xml", "product_code":"dataartsstudio", - "code":"412", + "code":"419", "des":"Daily scheduling is configured for the job, but there is no job scheduling record in the instance.Cause 1: Check whether the job scheduling is started. If not, the job wi", "doc_type":"usermanual", "kw":"Why Is There No Job Running Scheduling Record After Daily Scheduling Is Configured for the Job?,Data", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is There No Job Running Scheduling Record After Daily Scheduling Is Configured for the Job?", @@ -8594,17 +8814,18 @@ "uri":"dataartsstudio_03_0112.html", "node_id":"dataartsstudio_03_0112.xml", "product_code":"dataartsstudio", - "code":"413", + "code":"420", "des":"There is no content contained in the job log.If the bucket directory for storing job logs has been configured in the workspace, check whether you have the global permissi", "doc_type":"usermanual", "kw":"What Do I Do If No Content Is Displayed in Job Logs?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Do I Do If No Content Is Displayed in Job Logs?", @@ -8614,17 +8835,18 @@ "uri":"dataartsstudio_03_0113.html", "node_id":"dataartsstudio_03_0113.xml", "product_code":"dataartsstudio", - "code":"414", + "code":"421", "des":"Two jobs are created, but the dependency relationship cannot be established.Check whether the two jobs' recurrence are both every week or every month. Currently, if the t", "doc_type":"usermanual", "kw":"Why Do I Fail to Establish a Dependency Between Two Jobs?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Do I Fail to Establish a Dependency Between Two Jobs?", @@ -8634,57 +8856,60 @@ "uri":"dataartsstudio_03_0114.html", "node_id":"dataartsstudio_03_0114.xml", "product_code":"dataartsstudio", - "code":"415", - "des":"An error is reported when DataArts Studio executes scheduling: The job does not have a submitted version. Submit the job version first.Job scheduling process begins befor", + "code":"422", + "des":"An error is reported during job scheduling in DataArts Studio, indicating that the job has not been submitted.Job scheduling process begins before the version is submitte", "doc_type":"usermanual", - "kw":"What Should I Do If an Error Is Displayed During DataArts Studio Scheduling: The Job Does Not Have a", + "kw":"What Should I Do If an Error Is Reported During Job Scheduling in DataArts Studio, Indicating that t", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Should I Do If an Error Is Displayed During DataArts Studio Scheduling: The Job Does Not Have a Submitted Version?", + "title":"What Should I Do If an Error Is Reported During Job Scheduling in DataArts Studio, Indicating that the Job Has Not Been Submitted?", "githuburl":"" }, { "uri":"dataartsstudio_03_0115.html", "node_id":"dataartsstudio_03_0115.xml", "product_code":"dataartsstudio", - "code":"416", + "code":"423", "des":"An error is reported when DataArts Studio executes scheduling: The script associated with node XXX in the job is not submitted.Job scheduling process begins before the sc", "doc_type":"usermanual", - "kw":"What Do I Do If an Error Is Displayed During DataArts Studio Scheduling: The Script Associated with ", + "kw":"What Should I Do If an Error Is Reported During Job Scheduling in DataArts Studio, Indicating that t", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"What Do I Do If an Error Is Displayed During DataArts Studio Scheduling: The Script Associated with Node XXX in the Job Is Not Submitted?", + "title":"What Should I Do If an Error Is Reported During Job Scheduling in DataArts Studio, Indicating that the Script Associated with Node XXX in the Job Has Not Been Submitted?", "githuburl":"" }, { "uri":"dataartsstudio_03_0116.html", "node_id":"dataartsstudio_03_0116.xml", "product_code":"dataartsstudio", - "code":"417", + "code":"424", "des":"After a job is submitted for scheduling, the job fails to be executed and the following error is displayed \"depend job [XXX] is not running or pause\".The upstream depende", "doc_type":"usermanual", "kw":"What Should I Do If a Job Fails to Be Executed After Being Submitted for Scheduling and an Error Dis", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a Job Fails to Be Executed After Being Submitted for Scheduling and an Error Displayed: Depend Job [XXX] Is Not Running Or Pause?", @@ -8694,97 +8919,102 @@ "uri":"dataartsstudio_03_0127.html", "node_id":"dataartsstudio_03_0127.xml", "product_code":"dataartsstudio", - "code":"418", - "des":"Databases and data tables can be created in DLI.A database does not correspond to a data connection. A data connection is a connection channel for creating DataArts Studi", + "code":"425", + "des":"This section describes how to create databases and data tables, and the relationship between databases and data connections.You can create databases and data tables in Da", "doc_type":"usermanual", - "kw":"How Do I Create a Database And Data Table? Is the database a data connection?,DataArts Factory,User ", + "kw":"How Do I Create Databases and Data Tables? Do Databases Correspond to Data Connections?,DataArts Fac", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"How Do I Create a Database And Data Table? Is the database a data connection?", + "title":"How Do I Create Databases and Data Tables? Do Databases Correspond to Data Connections?", "githuburl":"" }, { "uri":"dataartsstudio_03_0129.html", "node_id":"dataartsstudio_03_0129.xml", "product_code":"dataartsstudio", - "code":"419", - "des":"Solution: Clear the cache data and use the direct connection to display the data.", + "code":"426", + "des":"The connection mode may be incorrect.Clear the cache data and use the direct connection to display the data.", "doc_type":"usermanual", - "kw":"Why Is No Result Displayed After an HIVE Task Is Executed?,DataArts Factory,User Guide", + "kw":"Why Is No Result Displayed After a Hive Task Is Executed?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why Is No Result Displayed After an HIVE Task Is Executed?", + "title":"Why Is No Result Displayed After a Hive Task Is Executed?", "githuburl":"" }, { "uri":"dataartsstudio_03_0135.html", "node_id":"dataartsstudio_03_0135.xml", "product_code":"dataartsstudio", - "code":"420", - "des":"The last instance status indicates a job has been executed, and the status can only be successful or failed. The Monitor Instance page displays all statuses of the job, i", + "code":"427", + "des":"The Last Instance Status on the Monitor Instance page is either successful or failed.The last instance status indicates a job has been executed, and the status can only b", "doc_type":"usermanual", - "kw":"Why Does the Last Instance Status On the Monitor Instance page Only Display Succeeded or Failed?,Dat", + "kw":"Why Is the Last Instance Status On the Monitor Instance Page Either Successful or Failed?,DataArts F", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why Does the Last Instance Status On the Monitor Instance page Only Display Succeeded or Failed?", + "title":"Why Is the Last Instance Status On the Monitor Instance Page Either Successful or Failed?", "githuburl":"" }, { "uri":"dataartsstudio_03_0148.html", "node_id":"dataartsstudio_03_0148.xml", "product_code":"dataartsstudio", - "code":"421", - "des":"Choose Monitoring > Monitor Job and click the Batch Job Monitoring tab.Select the jobs to be configured and click Configure Notification.Creating a notificationSet notifi", + "code":"428", + "des":"How to configure notifications for all jobsOn the DataArts Studio console, locate a workspace and click DataArts Factory.In the navigation pane on the left, choose Monito", "doc_type":"usermanual", - "kw":"How Do I Create a Notification for All Jobs?,DataArts Factory,User Guide", + "kw":"How Do I Configure Notifications for All Jobs?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"How Do I Create a Notification for All Jobs?", + "title":"How Do I Configure Notifications for All Jobs?", "githuburl":"" }, { "uri":"dataartsstudio_03_0193.html", "node_id":"dataartsstudio_03_0193.xml", "product_code":"dataartsstudio", - "code":"422", - "des":"Currently, the time zone of a DataArts Studio instance cannot be changed.During the scheduling of data development jobs, an EL expression can be used to adapt to the loca", + "code":"429", + "des":"Whether the time zone of a DataArts Studio instance can be changed. If not, how can the time of a DataArts Studio instance be adapted to the local time.Currently, the tim", "doc_type":"usermanual", "kw":"Can I Change the Time Zone of a DataArts Studio Instance?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Can I Change the Time Zone of a DataArts Studio Instance?", @@ -8794,17 +9024,18 @@ "uri":"dataartsstudio_03_0194.html", "node_id":"dataartsstudio_03_0194.xml", "product_code":"dataartsstudio", - "code":"423", - "des":"After renaming a CDM job, you need to select the renamed CDM job in the CDM node attributes on the DataArts Factory console.", + "code":"430", + "des":"Updated names of CDM jobs cannot be synchronized to DataArts Factory.After renaming a CDM job, you need to select the renamed CDM job in the CDM node attributes on the Da", "doc_type":"usermanual", "kw":"How Do I Synchronize the Changed Names of CDM Jobs to DataArts Factory?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Synchronize the Changed Names of CDM Jobs to DataArts Factory?", @@ -8814,17 +9045,18 @@ "uri":"dataartsstudio_03_0400.html", "node_id":"dataartsstudio_03_0400.xml", "product_code":"dataartsstudio", - "code":"424", - "des":"By default, the hll plug-in is created in the public schema. The SQL statement must contain the schema to which the hll belongs.", + "code":"431", + "des":"An RDS SQL statement fails to be executed and an error is reported indicating that hll does not exist.By default, the hll plug-in is created in the public schema. The SQL", "doc_type":"usermanual", "kw":"Why Does the Execution of an RDS SQL Statement Fail and an Error Is Reported Indicating That hll Doe", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Does the Execution of an RDS SQL Statement Fail and an Error Is Reported Indicating That hll Does Not Exist?", @@ -8834,17 +9066,18 @@ "uri":"dataartsstudio_03_0402.html", "node_id":"dataartsstudio_03_0402.xml", "product_code":"dataartsstudio", - "code":"425", + "code":"432", "des":"If the number of incorrect password attempts for connecting to the DWS cluster reaches the value of failed_login_attempts (10 by default), the account is automatically lo", "doc_type":"usermanual", "kw":"What Should I Do If Error Message \"The account has been locked\" Is Displayed When I Am Creating a DW", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error Message \"The account has been locked\" Is Displayed When I Am Creating a DWS Data Connection?", @@ -8854,37 +9087,39 @@ "uri":"dataartsstudio_03_0403.html", "node_id":"dataartsstudio_03_0403.xml", "product_code":"dataartsstudio", - "code":"426", - "des":"Some jobs on which this job instance depends failed. You can click the question mark (?) on the right of the instance status to view the failed jobs.", + "code":"433", + "des":"A job instance is canceled and message \"The node start execute failed, so the current node status is set to cancel.\" is displayed.Some jobs on which this job depends fail", "doc_type":"usermanual", - "kw":"Why Is a Job Instance Canceled and Message \"The node start execute failed, so the current node statu", + "kw":"What Should I Do If a Job Instance Is Canceled and Message \"The node start execute failed, so the cu", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], - "title":"Why Is a Job Instance Canceled and Message \"The node start execute failed, so the current node status is set to cancel.\" Displayed?", + "title":"What Should I Do If a Job Instance Is Canceled and Message \"The node start execute failed, so the current node status is set to cancel.\" Is Displayed?", "githuburl":"" }, { "uri":"dataartsstudio_03_0404.html", "node_id":"dataartsstudio_03_0404.xml", "product_code":"dataartsstudio", - "code":"427", - "des":"Add the project ID to the request header in the code, that is, header.add(\"X-Project-Id\",Project ID).", + "code":"434", + "des":"Error message \"Workspace does not exists\" is displayed when I call a DataArts Factory API.Add the project ID to the request header in the code, that is, header.add(\"X-Pro", "doc_type":"usermanual", "kw":"What Should I Do If Error Message \"Workspace does not exists\" Is Displayed When I Call a DataArts Fa", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error Message \"Workspace does not exists\" Is Displayed When I Call a DataArts Factory API?", @@ -8894,17 +9129,18 @@ "uri":"dataartsstudio_03_0405.html", "node_id":"dataartsstudio_03_0405.xml", "product_code":"dataartsstudio", - "code":"428", - "des":"The connector (&) for URL parameters must be escaped.", + "code":"435", + "des":"The URL parameters for calling an API take effect in the test environment when the API can be called properly using Postman.Escape the connector (&) for URL parameters.", "doc_type":"usermanual", "kw":"Why Don't the URL Parameters for Calling an API Take Effect in the Test Environment When the API Can", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Don't the URL Parameters for Calling an API Take Effect in the Test Environment When the API Can Be Called Properly Using Postman?", @@ -8914,17 +9150,18 @@ "uri":"dataartsstudio_03_0406.html", "node_id":"dataartsstudio_03_0406.xml", "product_code":"dataartsstudio", - "code":"429", - "des":"Use a CDM cluster of version 2.8.6 or a later version when creating a host connection.", + "code":"436", + "des":"The version of the CDM cluster selected during host connection creation may be too early.Use a CDM cluster of version 2.8.6 or a later version when creating a host connec", "doc_type":"usermanual", "kw":"What Should I Do If Error Message \"Agent need to be updated?\" Is Displayed When I Run a Python Scrip", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error Message \"Agent need to be updated?\" Is Displayed When I Run a Python Script?", @@ -8934,17 +9171,18 @@ "uri":"dataartsstudio_03_0407.html", "node_id":"dataartsstudio_03_0407.xml", "product_code":"dataartsstudio", - "code":"430", - "des":"The Succeed operation was performed on the node, which changed the job instance (and node) status to successful.", + "code":"437", + "des":"An execution failure is displayed for a node whose status is successful.The Succeed operation was performed on the node, which changed the job instance (and node) status ", "doc_type":"usermanual", "kw":"Why Is an Execution Failure Displayed for a Node in the Log When the Node Status Is Successful?,Data", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is an Execution Failure Displayed for a Node in the Log When the Node Status Is Successful?", @@ -8954,17 +9192,18 @@ "uri":"dataartsstudio_03_0408.html", "node_id":"dataartsstudio_03_0408.xml", "product_code":"dataartsstudio", - "code":"431", - "des":"DataArts Studio is a project-level service. Choose a project-level token.", + "code":"438", + "des":"An unknown exception occurs when I call a DataArts Factory API.DataArts Studio is a project-level service. Choose a project-level token.", "doc_type":"usermanual", "kw":"What Should I Do If an Unknown Exception Occurs When I Call a DataArts Factory API?,DataArts Factory", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If an Unknown Exception Occurs When I Call a DataArts Factory API?", @@ -8974,17 +9213,18 @@ "uri":"dataartsstudio_03_0409.html", "node_id":"dataartsstudio_03_0409.xml", "product_code":"dataartsstudio", - "code":"432", - "des":"The resource name can contain a maximum of 32 characters, including only letters, digits, underscores (_), and hyphens (-).", + "code":"439", + "des":"An error message indicating an invalid resource name is displayed when I call a resource creation API?The resource name can contain a maximum of 32 characters, including ", "doc_type":"usermanual", "kw":"Why Is an Error Message Indicating an Invalid Resource Name Is Displayed When I Call a Resource Crea", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is an Error Message Indicating an Invalid Resource Name Is Displayed When I Call a Resource Creation API?", @@ -8994,17 +9234,18 @@ "uri":"dataartsstudio_03_0410.html", "node_id":"dataartsstudio_03_0410.xml", "product_code":"dataartsstudio", - "code":"433", - "des":"The PatchData task may contain jobs in other workspaces. You can check the statuses of the job instance of the PatchData task in other workspaces.", + "code":"440", + "des":"A PatchData task fails when all PatchData job instances are successful.The PatchData task may contain jobs in other workspaces. You can check the statuses of the job inst", "doc_type":"usermanual", "kw":"Why Does a PatchData Task Fail When All PatchData Job Instances Are Successful?,DataArts Factory,Use", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Does a PatchData Task Fail When All PatchData Job Instances Are Successful?", @@ -9014,17 +9255,18 @@ "uri":"dataartsstudio_03_0411.html", "node_id":"dataartsstudio_03_0411.xml", "product_code":"dataartsstudio", - "code":"434", - "des":"The table already exists, but you do not have permissions to view and edit it.", + "code":"441", + "des":"Role permissions are insufficient.The table already exists, but you do not have permissions to view and edit it.", "doc_type":"usermanual", "kw":"Why Is a Table Unavailable When an Error Message Indicating that the Table Already Exists Is Display", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"Why Is a Table Unavailable When an Error Message Indicating that the Table Already Exists Is Displayed During Table Creation from a DWS Data Connection?", @@ -9034,17 +9276,18 @@ "uri":"dataartsstudio_03_0415.html", "node_id":"dataartsstudio_03_0415.xml", "product_code":"dataartsstudio", - "code":"435", - "des":"The following figure shows the error.MRS APIs can be called by a single user for a maximum of 60 times per minute. Therefore, the solution is to call the API less frequen", + "code":"442", + "des":"Error message \"The throttling threshold has been reached: policy user over ratelimit,limit:60,time:1 minute\" is displayed when I schedule an MRS Spark job.MRS APIs can be", "doc_type":"usermanual", "kw":"What Should I Do If Error Message \"The throttling threshold has been reached: policy user over ratel", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error Message \"The throttling threshold has been reached: policy user over ratelimit,limit:60,time:1 minute.\" Is Displayed When I Schedule an MRS Spark Job?", @@ -9054,17 +9297,18 @@ "uri":"dataartsstudio_03_0417.html", "node_id":"dataartsstudio_03_0417.xml", "product_code":"dataartsstudio", - "code":"436", + "code":"443", "des":"This error occurs when json.dumps(json_data, ensure_ascii=False) is configured in the Python script. The following figure shows the error.By default, DataArts Studio uses", "doc_type":"usermanual", "kw":"What Should I Do If Error Message \"UnicodeEncodeError: 'ascii' codec can't encode characters in posi", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error Message \"UnicodeEncodeError: 'ascii' codec can't encode characters in position 63-64: ordinal not in range(128)\" Is Displayed When I Run a Python Script?", @@ -9074,17 +9318,18 @@ "uri":"dataartsstudio_03_0418.html", "node_id":"dataartsstudio_03_0418.xml", "product_code":"dataartsstudio", - "code":"437", + "code":"444", "des":"When you view the logs of a data development node, the error message shown in the following figure is displayed.Logs of data development jobs are stored in OBS buckets. T", "doc_type":"usermanual", "kw":"What Should I Do If an Error Message Is Displayed When I View Logs?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If an Error Message Is Displayed When I View Logs?", @@ -9094,17 +9339,18 @@ "uri":"dataartsstudio_03_0618.html", "node_id":"dataartsstudio_03_0618.xml", "product_code":"dataartsstudio", - "code":"438", + "code":"445", "des":"This section uses the Shell node as an example.The Shell node fails to be executed, but the Shell script is executed successfully.Obtain the run logs of the Shell node.[2", "doc_type":"usermanual", "kw":"What Should I Do If a Shell/Python Node Fails and Error \"session is down\" Is Reported?,DataArts Fact", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a Shell/Python Node Fails and Error \"session is down\" Is Reported?", @@ -9114,17 +9360,18 @@ "uri":"dataartsstudio_03_0619.html", "node_id":"dataartsstudio_03_0619.xml", "product_code":"dataartsstudio", - "code":"439", + "code":"446", "des":"The Rest Client operator is used as an example.When configuring a parameter for a job operator, you need to enter the parameter name and value. If you already enter 512 c", "doc_type":"usermanual", "kw":"What Should I Do If a Parameter Value in a Request Header Contains More Than 512 Characters?,DataArt", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a Parameter Value in a Request Header Contains More Than 512 Characters?", @@ -9134,17 +9381,18 @@ "uri":"dataartsstudio_03_0620.html", "node_id":"dataartsstudio_03_0620.xml", "product_code":"dataartsstudio", - "code":"440", - "des":"This issue is caused by the case of id.During the execution of a DWS SQL script, the system uses lowercase letters by default. If a field is in upper case, add \"\".Example", + "code":"447", + "des":"This issue is caused by the case of the ID.During the execution of a DWS SQL script, the system uses lowercase letters by default. If a field is in upper case, add \"\".Exa", "doc_type":"usermanual", "kw":"What Should I Do If a Message Is Displayed Indicating that the ID Does Not Exist During the Executio", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If a Message Is Displayed Indicating that the ID Does Not Exist During the Execution of a DWS SQL Script?", @@ -9154,17 +9402,18 @@ "uri":"dataartsstudio_03_0621.html", "node_id":"dataartsstudio_03_0621.xml", "product_code":"dataartsstudio", - "code":"441", - "des":"In the left navigation pane of DataArts Factory, choose MonitoringJob Monitoring.Click the Batch Job Monitoring tab.Query the scheduling and execution of the CDM job by f", + "code":"448", + "des":"Jobs that invoke a CDM jobIn the left navigation pane of DataArts Factory, choose MonitoringJob Monitoring.Click the Batch Job Monitoring tab.Query the scheduling and exe", "doc_type":"usermanual", "kw":"How Do I Check Which Jobs Invoke a CDM Job?,DataArts Factory,User Guide", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"How Do I Check Which Jobs Invoke a CDM Job?", @@ -9174,27 +9423,91 @@ "uri":"dataartsstudio_03_0623.html", "node_id":"dataartsstudio_03_0623.xml", "product_code":"dataartsstudio", - "code":"442", - "des":"Symptom:Error message \"The request parameter invalid\" is displayed when Python is used to call the API for executing scripts.Call the script execution API by following th", + "code":"449", + "des":"Error message \"The request parameter invalid\" is displayed when Python is used to call the API for executing scripts.Call the script execution API by following the instru", "doc_type":"usermanual", "kw":"What Should I Do If Error Message \"The request parameter invalid\" Is Displayed When I Use Python to ", "search_title":"", "metedata":[ { - "IsMulti":"no", + "prodname":"dataartsstudio", + "IsMulti":"no;No", "documenttype":"usermanual", - "IsBot":"yes", - "prodname":"dataartsstudio" + "IsBot":"yes;No;Yes", + "opensource":"false;true" } ], "title":"What Should I Do If Error Message \"The request parameter invalid\" Is Displayed When I Use Python to Call the API for Executing Scripts?", "githuburl":"" }, + { + "uri":"dataartsstudio_03_0628.html", + "node_id":"dataartsstudio_03_0628.xml", + "product_code":"dataartsstudio", + "code":"450", + "des":"The default queue of a new DLI SQL script has been deleted.When a DLI SQL script is used or opened, the queue selected for the script is stored in the cache. This queue i", + "doc_type":"usermanual", + "kw":"What Should I Do If the Default Queue of a New DLI SQL Script in DataArts Factory Has Been Deleted?,", + "search_title":"", + "metedata":[ + { + "prodname":"dataartsstudio", + "IsMulti":"no;No", + "documenttype":"usermanual", + "IsBot":"yes;No;Yes", + "opensource":"false;true" + } + ], + "title":"What Should I Do If the Default Queue of a New DLI SQL Script in DataArts Factory Has Been Deleted?", + "githuburl":"" + }, + { + "uri":"dataartsstudio_03_0629.html", + "node_id":"dataartsstudio_03_0629.xml", + "product_code":"dataartsstudio", + "code":"451", + "des":"During the configuration of a job in DataArts Factory, offline Kafka cannot be selected when Scheduling Type is set to Event-based and Event Type is set to KAFKA.Only MRS", + "doc_type":"usermanual", + "kw":"Does the Event-based Scheduling Type in DataArts Factory Support Offline Kafka?,DataArts Factory,Use", + "search_title":"", + "metedata":[ + { + "prodname":"dataartsstudio", + "IsMulti":"no;No", + "documenttype":"usermanual", + "IsBot":"yes;No;Yes", + "opensource":"false;true" + } + ], + "title":"Does the Event-based Scheduling Type in DataArts Factory Support Offline Kafka?", + "githuburl":"" + }, + { + "uri":"dataartsstudio_03_0630.html", + "node_id":"dataartsstudio_03_0630.xml", + "product_code":"dataartsstudio", + "code":"452", + "des":"Error messages:Failed to query the user who submits the job on MRS Manager. The error code is 0191.The current user does not exist on MRS Manager. Grant the user sufficie", + "doc_type":"usermanual", + "kw":"What Should I Do If an Error Is Reported When I Submit an MRS Job with an Agency Through an MRS Clus", + "search_title":"", + "metedata":[ + { + "prodname":"dataartsstudio", + "IsMulti":"no;No", + "documenttype":"usermanual", + "IsBot":"yes;No;Yes", + "opensource":"false;true" + } + ], + "title":"What Should I Do If an Error Is Reported When I Submit an MRS Job with an Agency Through an MRS Cluster Connected Using an MRS API or the MRS Tenant Plane?", + "githuburl":"" + }, { "uri":"dataartsstudio_12_0010.html", "node_id":"dataartsstudio_12_0010.xml", "product_code":"dataartsstudio", - "code":"443", + "code":"453", "des":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "doc_type":"usermanual", "kw":"Change History,User Guide", diff --git a/docs/dataartsstudio/umn/CLASS.TXT.json b/docs/dataartsstudio/umn/CLASS.TXT.json index 98257c886..c94007296 100644 --- a/docs/dataartsstudio/umn/CLASS.TXT.json +++ b/docs/dataartsstudio/umn/CLASS.TXT.json @@ -72,7 +72,7 @@ "code":"8" }, { - "desc":"The following table lists the recommended browser for logging in to DataArts Studio.Browser compatibilityBrowserRecommended VersionRecommended OSRemarksGoogle Chrome115, ", + "desc":"The following table lists the recommended browser for logging in to DataArts Studio.Browser compatibilityBrowserRecommended VersionRecommended OSRemarksGoogle Chrome133, ", "product_code":"dataartsstudio", "title":"Notes and Constraints", "uri":"dataartsstudio_07_006.html", @@ -92,83 +92,200 @@ { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Preparations", - "uri":"dataartsstudio_12_0002.html", + "title":"User Guide", + "uri":"dataartsstudio_12_0004.html", "doc_type":"usermanual", "p_code":"", "code":"11" }, { - "desc":"Before using DataArts Studio, you need to create a a cloud platform account, create a DataArts Studio instance, access the DataArts Studio instance console, manage worksp", + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Preparations", - "uri":"dataartsstudio_01_0003.html", + "title":"Creating and Configuring a DataArts Studio Instance", + "uri":"dataartsstudio_01_1028.html", "doc_type":"usermanual", "p_code":"11", "code":"12" }, { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "desc":"Only users with DARTSAdministrator or Tenant Administrator permissions can create DataArts Studio instances or incremental packages.Users with Tenant Administrator permis", "product_code":"dataartsstudio", - "title":"Creating DataArts Studio Instances", - "uri":"dataartsstudio_01_1028.html", + "title":"Creating a DataArts Studio Instance", + "uri":"dataartsstudio_01_0115.html", "doc_type":"usermanual", - "p_code":"11", + "p_code":"12", "code":"13" }, { - "desc":"Only users who have the DARTS Administrator or Tenant Administrator permissions can create DataArts Studio instances or DataArts Studio incremental packages. To allow use", + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Creating a DataArts Studio Basic Package", - "uri":"dataartsstudio_01_0115.html", + "title":"Creating a DataArts Studio Incremental Package", + "uri":"dataartsstudio_01_0138.html", "doc_type":"usermanual", - "p_code":"13", + "p_code":"12", "code":"14" }, { - "desc":"DataArts Studio provides basic and incremental packages. If the basic package cannot meet your requirements, you can create an incremental package. Before you create an i", + "desc":"DataArts Studio provides basic and incremental packages. If the basic package cannot meet your demands, you need to create an incremental package.Table 1 lists the increm", "product_code":"dataartsstudio", - "title":"(Optional) Creating a DataArts Studio Incremental Package", - "uri":"dataartsstudio_01_0119.html", + "title":"Introduction to Incremental Packages", + "uri":"dataartsstudio_01_0139.html", "doc_type":"usermanual", - "p_code":"13", + "p_code":"14", "code":"15" }, { - "desc":"A DataArts Studio instance has been obtained. For details, see Creating a DataArts Studio Basic Package.If there are multiple DataArts Studio instances in the current reg", + "desc":"A DataArts Migration (that is, CDM) incremental package provides resources for a CDM cluster. When you create a CDM incremental package, the system automatically creates ", + "product_code":"dataartsstudio", + "title":"Creating a DataArts Migration Incremental Package", + "uri":"dataartsstudio_01_0119.html", + "doc_type":"usermanual", + "p_code":"14", + "code":"16" + }, + { + "desc":"This type of incremental package provides resource groups for real-time jobs in DataArts Migration. DataArts Migration resource groups can be used to migrate data to the ", + "product_code":"dataartsstudio", + "title":"Creating a DataArts Migration Resource Group Incremental Package", + "uri":"dataartsstudio_01_0145.html", + "doc_type":"usermanual", + "p_code":"14", + "code":"17" + }, + { + "desc":"You have obtained a DataArts Studio instance. For details, see Creating a DataArts Studio Instance.If there are multiple DataArts Studio instances in the current region, ", "product_code":"dataartsstudio", "title":"Accessing the DataArts Studio Instance Console", "uri":"dataartsstudio_01_0001.html", "doc_type":"usermanual", - "p_code":"11", - "code":"16" + "p_code":"12", + "code":"18" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Managing a Workspace", - "uri":"dataartsstudio_01_0011.html", + "title":"Creating and Configuring a Workspace in Simple Mode", + "uri":"dataartsstudio_01_0134.html", "doc_type":"usermanual", - "p_code":"11", - "code":"17" + "p_code":"12", + "code":"19" }, { - "desc":"The system will create a default workspace and assign the admin role to you after you create a DataArts Studio instance. can use the default workspace or create a new wor", + "desc":"The system creates a default workspace named default for the DataArts Studio instance you create and assigns administrator permissions to you. You can use the default wor", "product_code":"dataartsstudio", - "title":"Creating and Managing a Workspace", + "title":"Creating a Workspace in Simple Mode", "uri":"dataartsstudio_01_0116.html", "doc_type":"usermanual", - "p_code":"17", - "code":"18" + "p_code":"19", + "code":"20" }, { - "desc":"By default, job logs and DLI dirty data are stored in an OBS bucket named dlf-log-{project ID}. You can customize a log storage path. You can configure an OBS bucket glob", + "desc":"By default, job logs and DLI dirty data are stored in an OBS bucket named dlf-log-{project ID}. You can customize a storage path for logs and one for DLI dirty data. You ", "product_code":"dataartsstudio", "title":"(Optional) Changing the Job Log Storage Path", "uri":"dataartsstudio_01_0530.html", "doc_type":"usermanual", - "p_code":"17", - "code":"19" + "p_code":"19", + "code":"21" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"(Optional) Creating and Using a Workspace in Enterprise Mode", + "uri":"dataartsstudio_01_5098.html", + "doc_type":"usermanual", + "p_code":"12", + "code":"22" + }, + { + "desc":"DataArts Studio provides two workspace modes, the simplified mode and enterprise mode, to help you manage your production data with varied security control requirements. ", + "product_code":"dataartsstudio", + "title":"Introduction to the Enterprise Mode", + "uri":"dataartsstudio_01_5099.html", + "doc_type":"usermanual", + "p_code":"22", + "code":"23" + }, + { + "desc":"If you are using a workspace in simple mode and want to isolate the development and production environments, you can upgrade the workspace to one in enterprise mode. If y", + "product_code":"dataartsstudio", + "title":"Creating a Workspace in Enterprise Mode", + "uri":"dataartsstudio_01_5135.html", + "doc_type":"usermanual", + "p_code":"22", + "code":"24" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Operations Supported for Different Roles in Enterprise Mode", + "uri":"dataartsstudio_01_5106.html", + "doc_type":"usermanual", + "p_code":"22", + "code":"25" + }, + { + "desc":"The DataArts Studio enterprise mode mainly involves the Management Center and DataArts Factory components. The service process is completed by the admin, developer, deplo", + "product_code":"dataartsstudio", + "title":"Service Process in Enterprise Mode", + "uri":"dataartsstudio_01_5100.html", + "doc_type":"usermanual", + "p_code":"25", + "code":"26" + }, + { + "desc":"As the project owner or development owner, the admin manages the environment configuration and personnel roles in enterprise mode in a unified manner. The following table", + "product_code":"dataartsstudio", + "title":"Admin Operations", + "uri":"dataartsstudio_01_5101.html", + "doc_type":"usermanual", + "p_code":"25", + "code":"27" + }, + { + "desc":"The developer develops scripts and jobs. The following table describes related operations.", + "product_code":"dataartsstudio", + "title":"Developer Operations", + "uri":"dataartsstudio_01_5102.html", + "doc_type":"usermanual", + "p_code":"25", + "code":"28" + }, + { + "desc":"The deployer reviews the tasks to be released. This section describes related operations.The deployer reviews the release tasks submitted by the developer. Modified jobs ", + "product_code":"dataartsstudio", + "title":"Deployer Operations", + "uri":"dataartsstudio_01_5103.html", + "doc_type":"usermanual", + "p_code":"25", + "code":"29" + }, + { + "desc":"The operator manages the jobs, instances, notifications, and backups in the production environment in a unified manner. The following table describes related operations.", + "product_code":"dataartsstudio", + "title":"Operator Operations", + "uri":"dataartsstudio_01_5104.html", + "doc_type":"usermanual", + "p_code":"25", + "code":"30" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Managing DataArts Studio Resources", + "uri":"dataartsstudio_01_4105.html", + "doc_type":"usermanual", + "p_code":"12", + "code":"31" + }, + { + "desc":"Before creating a real-time data migration job, you need to associate the data migration resource group with a DataArts Studio workspace so that you can select a specifie", + "product_code":"dataartsstudio", + "title":"Associating a Real-Time Migration Resource Group with Workspaces", + "uri":"dataartsstudio_01_7587.html", + "doc_type":"usermanual", + "p_code":"31", + "code":"32" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -177,7 +294,7 @@ "uri":"dataartsstudio_01_0118.html", "doc_type":"usermanual", "p_code":"11", - "code":"20" + "code":"33" }, { "desc":"Identity and Access Management (IAM) can be used for fine-grained permissions management on your DataArts Studio resources. With IAM, you can:Create IAM users for employe", @@ -185,350 +302,278 @@ "title":"Creating an IAM User and Assigning DataArts Studio Permissions", "uri":"dataartsstudio_01_0004.html", "doc_type":"usermanual", - "p_code":"20", - "code":"21" - }, - { - "desc":"For IAM users with the DARTS User permission, a workspace role determines their permissions in the workspace. Currently, five preset roles are available: admin, developer", - "product_code":"dataartsstudio", - "title":"(Optional) Defining a Workspace Role", - "uri":"dataartsstudio_01_0120.html", - "doc_type":"usermanual", - "p_code":"20", - "code":"22" - }, - { - "desc":"For IAM users with the DARTS User permission, a workspace role determines their permissions in the workspace. If you want to allow another IAM user with the DARTS User pe", - "product_code":"dataartsstudio", - "title":"Adding a Member and Assigning a Role", - "uri":"dataartsstudio_01_0117.html", - "doc_type":"usermanual", - "p_code":"20", - "code":"23" - }, - { - "desc":"When using DataArts Studio, for example, when creating OBS links, calling APIs, or locating issues, you may need to obtain information such as access keys, project IDs, a", - "product_code":"dataartsstudio", - "title":"(Optional) Obtaining Authentication Information", - "uri":"dataartsstudio_01_0006.html", - "doc_type":"usermanual", - "p_code":"11", - "code":"24" - }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"User Guide", - "uri":"dataartsstudio_12_0004.html", - "doc_type":"usermanual", - "p_code":"", - "code":"25" - }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"Management Console", - "uri":"en-us_topic_0000002270846046.html", - "doc_type":"usermanual", - "p_code":"25", - "code":"26" - }, - { - "desc":"A tag is a key-value pair that identifies an instance. It consists of a key and a value.DataArts Studio instance tags can be used in the following scenarios:If there are ", - "product_code":"dataartsstudio", - "title":"Tags", - "uri":"en-us_topic_0000002270788944.html", - "doc_type":"usermanual", - "p_code":"26", - "code":"27" - }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"Enterprise Mode", - "uri":"dataartsstudio_01_5098.html", - "doc_type":"usermanual", - "p_code":"26", - "code":"28" - }, - { - "desc":"DataArts Studio provides two workspace modes, the simplified mode and enterprise mode, to help you manage your production data with varied security control requirements. ", - "product_code":"dataartsstudio", - "title":"DataArts Studio Enterprise Mode Overview", - "uri":"dataartsstudio_01_5099.html", - "doc_type":"usermanual", - "p_code":"28", - "code":"29" - }, - { - "desc":"The DataArts Studio enterprise mode mainly involves the Management Center and DataArts Factory components. The service process is completed by the admin, developer, deplo", - "product_code":"dataartsstudio", - "title":"Service Process in Enterprise Mode", - "uri":"dataartsstudio_01_5100.html", - "doc_type":"usermanual", - "p_code":"28", - "code":"30" - }, - { - "desc":"If you are using a workspace in simple mode and want to isolate the development and production environments, you can upgrade the workspace to one in enterprise mode. If y", - "product_code":"dataartsstudio", - "title":"Creating a Workspace in Enterprise Mode", - "uri":"dataartsstudio_01_5135.html", - "doc_type":"usermanual", - "p_code":"28", - "code":"31" - }, - { - "desc":"As the project owner or development owner, the admin manages the environment configuration and personnel roles in enterprise mode in a unified manner. The following table", - "product_code":"dataartsstudio", - "title":"Admin Operations", - "uri":"dataartsstudio_01_5101.html", - "doc_type":"usermanual", - "p_code":"28", - "code":"32" - }, - { - "desc":"The developer develops scripts and jobs. The following table describes related operations.", - "product_code":"dataartsstudio", - "title":"Developer Operations", - "uri":"dataartsstudio_01_5102.html", - "doc_type":"usermanual", - "p_code":"28", - "code":"33" - }, - { - "desc":"The deployer reviews the tasks to be released. This section describes related operations.The deployer reviews the release tasks submitted by the developer. Modified jobs ", - "product_code":"dataartsstudio", - "title":"Deployer Operations", - "uri":"dataartsstudio_01_5103.html", - "doc_type":"usermanual", - "p_code":"28", + "p_code":"33", "code":"34" }, { - "desc":"The operator manages the jobs, instances, notifications, and backups in the production environment in a unified manner. The following table describes related operations.", + "desc":"For IAM users with DARTS User account permissions, DataArts Studio workspace roles determine their permissions in workspaces. Preset roles include admin, developer, deplo", "product_code":"dataartsstudio", - "title":"Operator Operations", - "uri":"dataartsstudio_01_5104.html", + "title":"(Optional) Defining a Workspace Role", + "uri":"dataartsstudio_01_0107.html", "doc_type":"usermanual", - "p_code":"28", + "p_code":"33", "code":"35" }, + { + "desc":"For IAM users with DARTS User account permissions, their permissions in a DataArts Studio workspace are determined by workspace roles. If you want to share a DataArts Stu", + "product_code":"dataartsstudio", + "title":"Adding Workspace Members and Assigning Roles", + "uri":"dataartsstudio_01_0117.html", + "doc_type":"usermanual", + "p_code":"33", + "code":"36" + }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", "title":"Management Center", "uri":"dataartsstudio_01_0008.html", "doc_type":"usermanual", - "p_code":"25", - "code":"36" - }, - { - "desc":"Before using DataArts Studio, you need to select cloud services or databases as the data lake foundation, which provides storage and compute capabilities. DataArts Studio", - "product_code":"dataartsstudio", - "title":"Data Sources", - "uri":"dataartsstudio_01_0005_0.html", - "doc_type":"usermanual", - "p_code":"36", + "p_code":"11", "code":"37" }, { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "desc":"Before using DataArts Studio, you need to select cloud services or databases as the data foundation, which provides storage and compute capabilities. DataArts Studio prov", "product_code":"dataartsstudio", - "title":"Managing Data Connections", - "uri":"dataartsstudio_01_0009.html", + "title":"Data Sources Supported by DataArts Studio", + "uri":"dataartsstudio_01_0005.html", "doc_type":"usermanual", - "p_code":"36", + "p_code":"37", "code":"38" }, { "desc":"You can create data connections by configuring data sources. Based on the data connections of the Management Center, DataArts Studio performs data development, governance", "product_code":"dataartsstudio", - "title":"Creating a Data Connection", + "title":"Creating a DataArts Studio Data Connection", "uri":"dataartsstudio_01_1299.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"37", "code":"39" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Configuring a DWS Connection", - "uri":"dataartsstudio_01_1300.html", + "title":"Configuring DataArts Studio Data Connection Parameters", + "uri":"dataartsstudio_01_0009.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"37", "code":"40" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Configuring a DLI Connection", - "uri":"dataartsstudio_01_1301.html", + "title":"DWS Connection Parameters", + "uri":"dataartsstudio_01_1300.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"41" }, { - "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Configuring an MRS Hive Connection", - "uri":"dataartsstudio_01_1306.html", + "title":"DLI Connection Parameters", + "uri":"dataartsstudio_01_1301.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"42" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS HBase Connection", - "uri":"dataartsstudio_01_1307.html", + "title":"MRS Hive Connection Parameters", + "uri":"dataartsstudio_01_1306.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"43" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS Kafka Connection", - "uri":"dataartsstudio_01_1308.html", + "title":"MRS HBase Connection Parameters", + "uri":"dataartsstudio_01_1307.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"44" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS Spark Connection", - "uri":"dataartsstudio_01_1314.html", + "title":"MRS Kafka Connection Parameters", + "uri":"dataartsstudio_01_1308.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"45" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS ClickHouse Connection", - "uri":"dataartsstudio_01_1309.html", + "title":"MRS Spark Connection Parameters", + "uri":"dataartsstudio_01_1314.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"46" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS Hetu Connection", - "uri":"dataartsstudio_01_1310.html", + "title":"MRS ClickHouse Connection Parameters", + "uri":"dataartsstudio_01_1309.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"47" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS Impala Connection", - "uri":"dataartsstudio_01_1311.html", + "title":"MRS Hetu Connection Parameters", + "uri":"dataartsstudio_01_1310.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"48" }, { "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an MRS Doris Connection", - "uri":"dataartsstudio_01_1390.html", + "title":"MRS Impala Connection Parameters", + "uri":"dataartsstudio_01_1311.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"49" }, { - "desc":"You can create connections to RDS databases including MySQL, PostgreSQL, SQL Server, SAP HANA, and DM databases.", + "desc":"To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authenticatio", "product_code":"dataartsstudio", - "title":"Configuring an RDS Connection", - "uri":"dataartsstudio_01_1303.html", + "title":"Doris Connection Parameters", + "uri":"dataartsstudio_01_1390.html", "doc_type":"usermanual", - "p_code":"38", + "p_code":"40", "code":"50" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Configuring an Oracle Connection", + "title":"OpenSource ClickHouse Connection Parameters", + "uri":"dataartsstudio_01_1321.html", + "doc_type":"usermanual", + "p_code":"40", + "code":"51" + }, + { + "desc":"RDS connections can be used to connect to MySQL, PostgreSQL, and SQL Server databases.", + "product_code":"dataartsstudio", + "title":"RDS Connection Parameters", + "uri":"dataartsstudio_01_1303.html", + "doc_type":"usermanual", + "p_code":"40", + "code":"52" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Oracle Connection Parameters", "uri":"dataartsstudio_01_1302.html", "doc_type":"usermanual", - "p_code":"38", - "code":"51" + "p_code":"40", + "code":"53" }, { "desc":"The maximum number of shell or Python scripts that can run concurrently on the ECS is determined by the value of MaxSessions in the /etc/ssh/sshd_config file on the ECS. ", "product_code":"dataartsstudio", - "title":"Configuring a Host Connection", + "title":"Host Connection Parameters", "uri":"dataartsstudio_01_1305.html", "doc_type":"usermanual", - "p_code":"38", - "code":"52" - }, - { - "desc":"To migrate resources in one workspace to another, you can use the resource migration function provided by DataArts Studio.Resources that can be migrated include the data ", - "product_code":"dataartsstudio", - "title":"Migrating Resources", - "uri":"dataartsstudio_01_0010.html", - "doc_type":"usermanual", - "p_code":"36", - "code":"53" - }, - { - "desc":"You can configure isolation between the development and production environments for DLI and DB.After the environment isolation is configured, the data connection in the d", - "product_code":"dataartsstudio", - "title":"Configuring Environment Isolation for a Workspace in Enterprise Mode", - "uri":"dataartsstudio_01_5105.html", - "doc_type":"usermanual", - "p_code":"36", + "p_code":"40", "code":"54" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Tutorials", - "uri":"dataartsstudio_01_0350.html", + "title":"Rest Client Connection Parameters", + "uri":"dataartsstudio_01_1620.html", "doc_type":"usermanual", - "p_code":"36", + "p_code":"40", "code":"55" }, - { - "desc":"This section describes how to create an MRS Hive connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a databas", - "product_code":"dataartsstudio", - "title":"Creating an MRS Hive Connection", - "uri":"dataartsstudio_01_0351.html", - "doc_type":"usermanual", - "p_code":"55", - "code":"56" - }, - { - "desc":"This section describes how to create a DWS connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a database or c", - "product_code":"dataartsstudio", - "title":"Creating a DWS Connection", - "uri":"dataartsstudio_01_0352.html", - "doc_type":"usermanual", - "p_code":"55", - "code":"57" - }, - { - "desc":"This section describes how to create a MySQL connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a database or", - "product_code":"dataartsstudio", - "title":"Creating a MySQL Connection", - "uri":"dataartsstudio_01_0353.html", - "doc_type":"usermanual", - "p_code":"55", - "code":"58" - }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"DataArts Migration", + "title":"Redis Connection Parameters", + "uri":"dataartsstudio_01_1509.html", + "doc_type":"usermanual", + "p_code":"40", + "code":"56" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"SAP HANA Connection Parameters", + "uri":"dataartsstudio_01_1510.html", + "doc_type":"usermanual", + "p_code":"40", + "code":"57" + }, + { + "desc":"To migrate resources in one workspace to another, you can use the resource migration function provided by DataArts Studio.Resources can be imported from OBS or a local pa", + "product_code":"dataartsstudio", + "title":"Configuring DataArts Studio Resource Migration", + "uri":"dataartsstudio_01_0010.html", + "doc_type":"usermanual", + "p_code":"37", + "code":"58" + }, + { + "desc":"You can configure isolation between the development and production environments for DLI and DB.After the environment isolation is configured, the data connection in the d", + "product_code":"dataartsstudio", + "title":"Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode", + "uri":"dataartsstudio_01_5105.html", + "doc_type":"usermanual", + "p_code":"37", + "code":"59" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Typical Scenarios for Using Management Center", + "uri":"dataartsstudio_01_0350.html", + "doc_type":"usermanual", + "p_code":"37", + "code":"60" + }, + { + "desc":"This section describes how to create an MRS Hive connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a databas", + "product_code":"dataartsstudio", + "title":"Creating a Connection Between DataArts Studio and an MRS Hive Data Lake", + "uri":"dataartsstudio_01_0351.html", + "doc_type":"usermanual", + "p_code":"60", + "code":"61" + }, + { + "desc":"This section describes how to create a DWS connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a database or c", + "product_code":"dataartsstudio", + "title":"Creating a Connection Between DataArts Studio and a GaussDB(DWS) Data Lake", + "uri":"dataartsstudio_01_0352.html", + "doc_type":"usermanual", + "p_code":"60", + "code":"62" + }, + { + "desc":"This section describes how to create a MySQL connection between DataArts Studio and the data lake base.You have created a data lake to connect, for example, a database or", + "product_code":"dataartsstudio", + "title":"Creating a Connection Between DataArts Studio and a MySQL Database", + "uri":"dataartsstudio_01_0353.html", + "doc_type":"usermanual", + "p_code":"60", + "code":"63" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"DataArts Migration (CDM Jobs)", "uri":"dataartsstudio_01_0012.html", "doc_type":"usermanual", - "p_code":"25", - "code":"59" + "p_code":"11", + "code":"64" }, { "desc":"DataArts Migration is an efficient and easy-to-use data integration service. Based on the big data migration to the cloud and intelligent data lake solutions, CDM provide", @@ -536,17 +581,17 @@ "title":"Overview", "uri":"dataartsstudio_01_0013.html", "doc_type":"usermanual", - "p_code":"59", - "code":"60" + "p_code":"64", + "code":"65" }, { - "desc":"You cannot modify the flavor of an existing cluster. If you require a higher flavor, create a cluster with your desired flavor.Arm CDM clusters do not support agents. The", + "desc":"You cannot modify the flavor of an existing cluster. If you require a higher flavor, create a cluster with your desired flavor.The CDM cluster version (Arm or x86) is det", "product_code":"dataartsstudio", - "title":"Constraints", + "title":"Notes and Constraints", "uri":"dataartsstudio_01_0015.html", "doc_type":"usermanual", - "p_code":"59", - "code":"61" + "p_code":"64", + "code":"66" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -554,8 +599,8 @@ "title":"Supported Data Sources", "uri":"dataartsstudio_01_0215.html", "doc_type":"usermanual", - "p_code":"59", - "code":"62" + "p_code":"64", + "code":"67" }, { "desc":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", @@ -563,17 +608,8 @@ "title":"Supported Data Sources (2.10.0.300)", "uri":"dataartsstudio_01_0196.html", "doc_type":"usermanual", - "p_code":"62", - "code":"63" - }, - { - "desc":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", - "product_code":"dataartsstudio", - "title":"Supported Data Sources (2.10.0.100)", - "uri":"dataartsstudio_01_0197.html", - "doc_type":"usermanual", - "p_code":"62", - "code":"64" + "p_code":"67", + "code":"68" }, { "desc":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", @@ -581,8 +617,8 @@ "title":"Supported Data Sources (2.9.3.300)", "uri":"dataartsstudio_01_0014.html", "doc_type":"usermanual", - "p_code":"62", - "code":"65" + "p_code":"67", + "code":"69" }, { "desc":"CDM provides the following migration modes which support different data sources:Table/File migration in the import of data into a data lake or migration of data to the cl", @@ -590,8 +626,8 @@ "title":"Supported Data Sources (2.9.2.200)", "uri":"dataartsstudio_01_0816.html", "doc_type":"usermanual", - "p_code":"62", - "code":"66" + "p_code":"67", + "code":"70" }, { "desc":"To ensure that data is completely imported to the migration destination, correctly configure field mappings based on data types supported for different data sources. For ", @@ -599,17 +635,17 @@ "title":"Supported Data Types", "uri":"dataartsstudio_01_0224.html", "doc_type":"usermanual", - "p_code":"62", - "code":"67" + "p_code":"67", + "code":"71" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Managing Clusters", + "title":"Creating and Managing a CDM Cluster", "uri":"dataartsstudio_01_0017.html", "doc_type":"usermanual", - "p_code":"59", - "code":"68" + "p_code":"64", + "code":"72" }, { "desc":"CDM provides independent clusters for secure and reliable data migration. Clusters are isolated from each other and cannot access each other.CDM clusters can be used in t", @@ -617,62 +653,62 @@ "title":"Creating a CDM Cluster", "uri":"dataartsstudio_01_0576.html", "doc_type":"usermanual", - "p_code":"68", - "code":"69" + "p_code":"72", + "code":"73" }, { "desc":"After creating a CDM cluster, you can bind an EIP to or unbind an EIP from the cluster.If CDM needs to access a local or Internet data source, or a cloud service in anoth", "product_code":"dataartsstudio", "title":"Binding or Unbinding an EIP", - "uri":"dataartsstudio_01_0020_0.html", + "uri":"dataartsstudio_01_0586.html", "doc_type":"usermanual", - "p_code":"68", - "code":"70" + "p_code":"72", + "code":"74" }, { - "desc":"After modifying some configurations (for example, disabling user isolation), you must restart the cluster to make the modification take effect.You have created a CDM clus", + "desc":"After modifying some configurations (for example, disabling user isolation), you must restart the cluster to make the modification take effect.If you restart a CDM cluste", "product_code":"dataartsstudio", - "title":"Restarting a Cluster", + "title":"Restarting a CDM Cluster", "uri":"dataartsstudio_01_0578.html", "doc_type":"usermanual", - "p_code":"68", - "code":"71" + "p_code":"72", + "code":"75" }, { "desc":"You can delete a CDM cluster that you no longer use.After a CDM cluster is deleted, the cluster and its data are destroyed and cannot be restored. Exercise caution when p", "product_code":"dataartsstudio", - "title":"Deleting a Cluster", + "title":"Deleting a CDM Cluster", "uri":"dataartsstudio_01_0579.html", "doc_type":"usermanual", - "p_code":"68", - "code":"72" + "p_code":"72", + "code":"76" }, { "desc":"This section describes how to obtain cluster logs to view the job running history and locate job failure causes.You have created a CDM cluster.", "product_code":"dataartsstudio", - "title":"Downloading Cluster Logs", + "title":"Downloading CDM Cluster Logs", "uri":"dataartsstudio_01_0022.html", "doc_type":"usermanual", - "p_code":"68", - "code":"73" + "p_code":"72", + "code":"77" }, { - "desc":"After creating a CDM cluster, you can view its basic information and modify its configurations.You can view the following basic cluster information:Cluster information: c", + "desc":"After creating a CDM cluster, you can view its basic information and modify its configurations.You can view the following basic cluster information:Cluster Information: c", "product_code":"dataartsstudio", - "title":"Viewing Basic Cluster Information and Modifying Cluster Configurations", - "uri":"dataartsstudio_01_0021_0.html", + "title":"Viewing and Modifying CDM Cluster Configurations", + "uri":"dataartsstudio_01_0587.html", "doc_type":"usermanual", - "p_code":"68", - "code":"74" + "p_code":"72", + "code":"78" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Viewing Metrics", + "title":"Managing and Viewing CDM Metrics", "uri":"dataartsstudio_01_0121.html", "doc_type":"usermanual", - "p_code":"68", - "code":"75" + "p_code":"72", + "code":"79" }, { "desc":"Cloud Eye monitors the running status of cloud services and usage of each metric, and creates alarm rules for monitoring metrics.After you create a CDM cluster, Cloud Eye", @@ -680,314 +716,323 @@ "title":"CDM Metrics", "uri":"dataartsstudio_01_0122.html", "doc_type":"usermanual", - "p_code":"75", - "code":"76" - }, - { - "desc":"Set the alarm rules to customize the monitored objects and notification policies. Then, learn CDM running status in a timely manner.A CDM alarm rule includes the alarm ru", - "product_code":"dataartsstudio", - "title":"Configuring Alarm Rules", - "uri":"dataartsstudio_01_0123.html", - "doc_type":"usermanual", - "p_code":"75", - "code":"77" - }, - { - "desc":"You can use Cloud Eye to monitor the running status of a CDM cluster. You can view the monitoring metrics on the Cloud Eye console.Monitored data takes some time for tran", - "product_code":"dataartsstudio", - "title":"Querying Metrics", - "uri":"dataartsstudio_01_0124.html", - "doc_type":"usermanual", - "p_code":"75", - "code":"78" - }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"Managing Links", - "uri":"dataartsstudio_01_0023.html", - "doc_type":"usermanual", - "p_code":"59", - "code":"79" - }, - { - "desc":"Before creating a data migration job, create a link to enable the CDM cluster to read data from and write data to a data source. A migration job requires a source link an", - "product_code":"dataartsstudio", - "title":"Creating Links", - "uri":"dataartsstudio_01_0024.html", - "doc_type":"usermanual", "p_code":"79", "code":"80" }, { - "desc":"The Java Database Connectivity (JDBC) provides programmatic access to relational databases. Applications can execute SQL statements and retrieve data using the JDBC API.B", + "desc":"Set the alarm rules to customize the monitored objects and notification policies. Then, learn CDM running status in a timely manner.A CDM alarm rule includes the alarm ru", "product_code":"dataartsstudio", - "title":"Managing Drivers", - "uri":"dataartsstudio_01_0132.html", + "title":"Configuring CDM Alarm Rules", + "uri":"dataartsstudio_01_0123.html", "doc_type":"usermanual", "p_code":"79", "code":"81" }, { - "desc":"If your data is stored in HDFS or a relational database, you can deploy an agent on the source network. CDM pulls data from your internal data sources through an agent bu", + "desc":"You can use Cloud Eye to monitor the running status of a CDM cluster. You can view the monitoring metrics on the Cloud Eye console.Monitored data takes some time for tran", "product_code":"dataartsstudio", - "title":"Managing Agents", - "uri":"dataartsstudio_01_0128.html", + "title":"Querying CDM Metrics", + "uri":"dataartsstudio_01_0124.html", "doc_type":"usermanual", "p_code":"79", "code":"82" }, { - "desc":"On the Cluster Configurations page, you can create, edit, or delete Hadoop cluster configurations.When creating a Hadoop link, the Hadoop cluster configurations can simpl", + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Managing Cluster Configurations", - "uri":"dataartsstudio_01_1096.html", + "title":"Creating a Link in a CDM Cluster", + "uri":"dataartsstudio_01_0023.html", "doc_type":"usermanual", - "p_code":"79", + "p_code":"64", "code":"83" }, { - "desc":"When connecting CDM to the destination OBS bucket, you need to add the read and write permissions to the destination OBS bucket, and file authentication is not required.I", + "desc":"Before creating a data migration job, create a link to enable the CDM cluster to read data from and write data to a data source. A migration job requires a source link an", "product_code":"dataartsstudio", - "title":"Link to OBS", - "uri":"dataartsstudio_01_0045.html", + "title":"Creating a Link Between CDM and a Data Source", + "uri":"dataartsstudio_01_0024.html", "doc_type":"usermanual", - "p_code":"79", + "p_code":"83", "code":"84" }, - { - "desc":"Table 1 lists the parameters for creating a link to PostgreSQL/SQLServer.Do not change the password or user when the job is running. If you do so, the password will not t", - "product_code":"dataartsstudio", - "title":"Link to PostgreSQL/SQLServer", - "uri":"dataartsstudio_01_0044.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"85" - }, - { - "desc":"Table 1 describes the DWS link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the ", - "product_code":"dataartsstudio", - "title":"Link to DWS", - "uri":"dataartsstudio_01_0226.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"86" - }, - { - "desc":"Table 1 lists the parameters for a link to a MySQL database.Do not change the password or user when the job is running. If you do so, the password will not take effect im", - "product_code":"dataartsstudio", - "title":"Link to an RDS for MySQL/MySQL Database", - "uri":"dataartsstudio_01_1211.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"87" - }, - { - "desc":"Table 1 lists the parameters for a link to an Oracle database.Do not change the password or user when the job is running. If you do so, the password will not take effect ", - "product_code":"dataartsstudio", - "title":"Link to an Oracle Database", - "uri":"dataartsstudio_01_1212.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"88" - }, - { - "desc":"When connecting CDM to DLI, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password will n", - "product_code":"dataartsstudio", - "title":"Link to DLI", - "uri":"dataartsstudio_01_0036.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"89" - }, - { - "desc":"CDM supports the following Hive data sources:MRS HiveFusionInsight HiveApache HiveDo not change the password or user when the job is running. If you do so, the password w", - "product_code":"dataartsstudio", - "title":"Link to Hive", - "uri":"dataartsstudio_01_0026.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"90" - }, - { - "desc":"CDM supports the following HBase data sources:MRS HBaseFusionInsight HBaseApache HBaseDo not change the password or user when the job is running. If you do so, the passwo", - "product_code":"dataartsstudio", - "title":"Link to HBase", - "uri":"dataartsstudio_01_0039.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"91" - }, - { - "desc":"CDM supports the following HDFS data sources:MRS HDFSFusionInsight HDFSApache HDFSDo not change the password or user when the job is running. If you do so, the password w", - "product_code":"dataartsstudio", - "title":"Link to HDFS", - "uri":"dataartsstudio_01_0040.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"92" - }, - { - "desc":"The FTP/SFTP link is used to migrate files from the on-premises file server or ECS to a database.Only FTP servers running Linux are supported.Do not change the password o", - "product_code":"dataartsstudio", - "title":"Link to an FTP or SFTP Server", - "uri":"dataartsstudio_01_0028.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"93" - }, - { - "desc":"The Redis link is applicable to data migration of Redis created in the local data center or ECS. It is used to load data in the database or files to Redis.Links to Redis ", - "product_code":"dataartsstudio", - "title":"Link to Redis", - "uri":"dataartsstudio_01_0032.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"94" - }, - { - "desc":"The DDS link is used to synchronize data from Document Database Service (DDS) on the cloud to a big data platform.When connecting CDM to DDS, configure the parameters as ", - "product_code":"dataartsstudio", - "title":"Link to DDS", - "uri":"dataartsstudio_01_0031.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"95" - }, - { - "desc":"When connecting CDM to CloudTable, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password", - "product_code":"dataartsstudio", - "title":"Link to CloudTable", - "uri":"dataartsstudio_01_0027.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"96" - }, - { - "desc":"This link is used to transfer data from a third-party cloud MongoDB service or MongoDB created in the on-premises data center or ECS to a big data platform.When connectin", - "product_code":"dataartsstudio", - "title":"Link to MongoDB", - "uri":"dataartsstudio_01_0030.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"97" - }, - { - "desc":"Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.", - "product_code":"dataartsstudio", - "title":"Link to Cassandra", - "uri":"dataartsstudio_01_004501.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"98" - }, - { - "desc":"When connecting CDM to Kafka of MRS, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the passwo", - "product_code":"dataartsstudio", - "title":"Link to Kafka", - "uri":"dataartsstudio_01_0033.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"99" - }, - { - "desc":"When connecting CDM to DMS Kafka, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password ", - "product_code":"dataartsstudio", - "title":"Link to DMS Kafka", - "uri":"dataartsstudio_01_0038.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"100" - }, - { - "desc":"Cloud Search Service (CSS) is a fully hosted distributed search service powered by open-source Elasticsearch. CSS links can be used to migrate log files and database reco", - "product_code":"dataartsstudio", - "title":"Link to CSS", - "uri":"dataartsstudio_01_0035.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"101" - }, - { - "desc":"Elasticsearch links can be used to connect to Elasticsearch services in third-party clouds and local data centers and on Elastic Cloud Servers (ECSs).The Elasticsearch co", - "product_code":"dataartsstudio", - "title":"Link to Elasticsearch", - "uri":"dataartsstudio_01_1380.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"102" - }, - { - "desc":"Table 1 describes the SAP HANA link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and", - "product_code":"dataartsstudio", - "title":"Link to SAP HANA", - "uri":"dataartsstudio_01_0227.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"103" - }, - { - "desc":"Sharding refers to the link to multiple backend data sources at the same time. The link can be used as the job source to migrate data from multiple data sources to other ", - "product_code":"dataartsstudio", - "title":"Link to a Database Shard", - "uri":"dataartsstudio_01_1214.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"104" - }, - { - "desc":"Table 1 describes the MRS Hudi link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and", - "product_code":"dataartsstudio", - "title":"Link to MRS Hudi", - "uri":"dataartsstudio_01_0184.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"105" - }, - { - "desc":"Table 1 describes the MRS ClickHouse link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediate", - "product_code":"dataartsstudio", - "title":"Link to MRS ClickHouse", - "uri":"dataartsstudio_01_0285.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"106" - }, - { - "desc":"Table 1 lists the parameters for a link to a ShenTong database.Do not change the password or user when the job is running. If you do so, the password will not take effect", - "product_code":"dataartsstudio", - "title":"Link to a ShenTong Database", - "uri":"dataartsstudio_01_0290.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"107" - }, - { - "desc":"When connecting CDM to CloudTable OpenTSDB, configure the parameters as described in Table 1.", - "product_code":"dataartsstudio", - "title":"Link to CloudTable OpenTSDB", - "uri":"dataartsstudio_01_0037.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"108" - }, - { - "desc":"CDM can connect to open-source Doris and MRS Doris. Table 1 lists the parameters for a Doris link.Do not change the password or user when the job is running. If you do so", - "product_code":"dataartsstudio", - "title":"Link to Doris", - "uri":"dataartsstudio_01_1215.html", - "doc_type":"usermanual", - "p_code":"79", - "code":"109" - }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Managing Jobs", + "title":"Configuring Link Parameters", + "uri":"dataartsstudio_01_0157.html", + "doc_type":"usermanual", + "p_code":"83", + "code":"85" + }, + { + "desc":"When connecting CDM to the destination OBS bucket, you need to add the read and write permissions to the destination OBS bucket, and file authentication is not required.I", + "product_code":"dataartsstudio", + "title":"OBS Link Parameters", + "uri":"dataartsstudio_01_0045.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"86" + }, + { + "desc":"Table 1 lists the parameters for creating a link to PostgreSQL/SQLServer. Greenplum, Kingbase, and GaussDB can be connected through the PostgreSQL connector. The source a", + "product_code":"dataartsstudio", + "title":"PostgreSQL/SQLServer Link Parameters", + "uri":"dataartsstudio_01_0044.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"87" + }, + { + "desc":"Table 1 describes the DWS link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the ", + "product_code":"dataartsstudio", + "title":"GaussDB(DWS) Link Parameters", + "uri":"dataartsstudio_01_0226.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"88" + }, + { + "desc":"Table 1 lists the parameters for a link to a MySQL database.Do not change the password or user when the job is running. If you do so, the password will not take effect im", + "product_code":"dataartsstudio", + "title":"RDS for MySQL/MySQL Database Link Parameters", + "uri":"dataartsstudio_01_1211.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"89" + }, + { + "desc":"Table 1 lists the parameters for a link to an Oracle database.Do not change the password or user when the job is running. If you do so, the password will not take effect ", + "product_code":"dataartsstudio", + "title":"Oracle Database Link Parameters", + "uri":"dataartsstudio_01_1212.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"90" + }, + { + "desc":"When connecting CDM to DLI, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password will n", + "product_code":"dataartsstudio", + "title":"DLI Link Parameters", + "uri":"dataartsstudio_01_0036.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"91" + }, + { + "desc":"CDM supports the following Hive data sources:MRS HiveFusionInsight HiveApache HiveDo not change the password or user when the job is running. If you do so, the password w", + "product_code":"dataartsstudio", + "title":"Hive Link Parameters", + "uri":"dataartsstudio_01_0026.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"92" + }, + { + "desc":"CDM supports the following HBase data sources:MRS HBaseFusionInsight HBaseApache HBaseDo not change the password or user when the job is running. If you do so, the passwo", + "product_code":"dataartsstudio", + "title":"HBase Link Parameters", + "uri":"dataartsstudio_01_0039.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"93" + }, + { + "desc":"CDM supports the following HDFS data sources:MRS HDFSFusionInsight HDFSApache HDFSDo not change the password or user when the job is running. If you do so, the password w", + "product_code":"dataartsstudio", + "title":"HDFS Link Parameters", + "uri":"dataartsstudio_01_0040.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"94" + }, + { + "desc":"The FTP/SFTP link is used to migrate files from the on-premises file server or ECS to a database.Only FTP servers running Linux are supported.Do not change the password o", + "product_code":"dataartsstudio", + "title":"FTP/SFTP Link Parameters", + "uri":"dataartsstudio_01_0028.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"95" + }, + { + "desc":"The Redis link is applicable to data migration of Redis created in the local data center or ECS. It is used to load data in the database or files to Redis.Links to Redis ", + "product_code":"dataartsstudio", + "title":"Redis Link Parameters", + "uri":"dataartsstudio_01_0032.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"96" + }, + { + "desc":"The DDS link is used to synchronize data from Document Database Service (DDS) on the cloud to a big data platform.When connecting CDM to DDS, configure the parameters as ", + "product_code":"dataartsstudio", + "title":"DDS Link Parameters", + "uri":"dataartsstudio_01_0031.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"97" + }, + { + "desc":"When connecting CDM to CloudTable, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password", + "product_code":"dataartsstudio", + "title":"CloudTable Link Parameters", + "uri":"dataartsstudio_01_0027.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"98" + }, + { + "desc":"This link is used to transfer data from a third-party cloud MongoDB service or MongoDB created in the on-premises data center or ECS to a big data platform.When connectin", + "product_code":"dataartsstudio", + "title":"MongoDB Link Parameters", + "uri":"dataartsstudio_01_0030.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"99" + }, + { + "desc":"Cassandra is not supported in version 2.9.3.300 or later.Do not change the password or user when a job is running. If you do so, the password will not take effect immedia", + "product_code":"dataartsstudio", + "title":"Cassandra Link Parameters", + "uri":"dataartsstudio_01_004501.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"100" + }, + { + "desc":"When connecting CDM to Kafka of MRS, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the passwo", + "product_code":"dataartsstudio", + "title":"Kafka Link Parameters", + "uri":"dataartsstudio_01_0033.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"101" + }, + { + "desc":"When connecting CDM to DMS Kafka, configure the parameters as described in Table 1.Do not change the password or user when the job is running. If you do so, the password ", + "product_code":"dataartsstudio", + "title":"DMS Kafka Link Parameters", + "uri":"dataartsstudio_01_0038.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"102" + }, + { + "desc":"Cloud Search Service (CSS) is a fully hosted distributed search service powered by open-source Elasticsearch. CSS links can be used to migrate log files and database reco", + "product_code":"dataartsstudio", + "title":"CSS Link Parameters", + "uri":"dataartsstudio_01_0035.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"103" + }, + { + "desc":"Elasticsearch links can be used to connect to Elasticsearch services in third-party clouds and local data centers and on Elastic Cloud Servers (ECSs).The Elasticsearch co", + "product_code":"dataartsstudio", + "title":"Elasticsearch Link Parameters", + "uri":"dataartsstudio_01_1380.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"104" + }, + { + "desc":"Table 1 describes the SAP HANA link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and", + "product_code":"dataartsstudio", + "title":"SAP HANA Link Parameters", + "uri":"dataartsstudio_01_0227.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"105" + }, + { + "desc":"Sharding refers to the link to multiple backend data sources at the same time. The link can be used as the job source to migrate data from multiple data sources to other ", + "product_code":"dataartsstudio", + "title":"Shard Link Parameters", + "uri":"dataartsstudio_01_1214.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"106" + }, + { + "desc":"Table 1 describes the MRS Hudi link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and", + "product_code":"dataartsstudio", + "title":"MRS Hudi Link Parameters", + "uri":"dataartsstudio_01_0184.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"107" + }, + { + "desc":"Table 1 describes the MRS ClickHouse link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediate", + "product_code":"dataartsstudio", + "title":"MRS ClickHouse Link Parameters", + "uri":"dataartsstudio_01_0285.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"108" + }, + { + "desc":"Table 1 lists the parameters for a link to a ShenTong database.Do not change the password or user when the job is running. If you do so, the password will not take effect", + "product_code":"dataartsstudio", + "title":"ShenTong Database Link Parameters", + "uri":"dataartsstudio_01_0290.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"109" + }, + { + "desc":"Table 1 describes the LogHub (SLS) link parameters.", + "product_code":"dataartsstudio", + "title":"LogHub (SLS) Link Parameters", + "uri":"dataartsstudio_01_0288.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"110" + }, + { + "desc":"When connecting CDM to CloudTable OpenTSDB, configure the parameters as described in Table 1.", + "product_code":"dataartsstudio", + "title":"CloudTable OpenTSDB Link Parameters", + "uri":"dataartsstudio_01_0037.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"111" + }, + { + "desc":"Table 1 describes the YASHAN link parameters.Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and t", + "product_code":"dataartsstudio", + "title":"YASHAN Link Parameters", + "uri":"dataartsstudio_01_1628.html", + "doc_type":"usermanual", + "p_code":"85", + "code":"112" + }, + { + "desc":"The Java Database Connectivity (JDBC) provides programmatic access to relational databases. Applications can execute SQL statements and retrieve data using the JDBC API.B", + "product_code":"dataartsstudio", + "title":"Uploading a CDM Link Driver", + "uri":"dataartsstudio_01_0132.html", + "doc_type":"usermanual", + "p_code":"83", + "code":"113" + }, + { + "desc":"On the Cluster Configurations page, you can create, edit, or delete Hadoop cluster configurations.When creating a Hadoop link, the Hadoop cluster configurations can simpl", + "product_code":"dataartsstudio", + "title":"Creating a Hadoop Cluster Configuration", + "uri":"dataartsstudio_01_1096.html", + "doc_type":"usermanual", + "p_code":"83", + "code":"114" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Creating a Job in a CDM Cluster", "uri":"dataartsstudio_01_0081.html", "doc_type":"usermanual", - "p_code":"59", - "code":"110" + "p_code":"64", + "code":"115" }, { "desc":"CDM supports table and file migration between homogeneous or heterogeneous data sources. For details about supported data sources, see Supported Data Sources.The dirty da", @@ -995,8 +1040,8 @@ "title":"Table/File Migration Jobs", "uri":"dataartsstudio_01_0046.html", "doc_type":"usermanual", - "p_code":"110", - "code":"111" + "p_code":"115", + "code":"116" }, { "desc":"CDM supports entire DB migration between homogeneous and heterogeneous data sources. The migration principles are the same as those in Table/File Migration Jobs. Each typ", @@ -1004,17 +1049,17 @@ "title":"Creating an Entire Database Migration Job", "uri":"dataartsstudio_01_0075.html", "doc_type":"usermanual", - "p_code":"110", - "code":"112" + "p_code":"115", + "code":"117" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Source Job Parameters", + "title":"Configuring CDM Source Job Parameters", "uri":"dataartsstudio_01_0047.html", "doc_type":"usermanual", - "p_code":"110", - "code":"113" + "p_code":"115", + "code":"118" }, { "desc":"If the source link of a job is an OBS link, configure the source job parameters based on Table 1.Advanced attributes are optional and not displayed by default. You can cl", @@ -1022,8 +1067,8 @@ "title":"From OBS", "uri":"dataartsstudio_01_0048.html", "doc_type":"usermanual", - "p_code":"113", - "code":"114" + "p_code":"118", + "code":"119" }, { "desc":"If the source link of a job is an HDFS link, that is, if data is exported from MRS HDFS, FusionInsight HDFS, or Apache HDFS, configure the source job parameters based on ", @@ -1031,8 +1076,8 @@ "title":"From HDFS", "uri":"dataartsstudio_01_0049.html", "doc_type":"usermanual", - "p_code":"113", - "code":"115" + "p_code":"118", + "code":"120" }, { "desc":"If the source link of a job is an HBase or CloudTable link, that is, if data is exported from MRS HBase, FusionInsight HBase, CloudTable, or Apache HBase, configure the s", @@ -1040,8 +1085,8 @@ "title":"From HBase/CloudTable", "uri":"dataartsstudio_01_0050.html", "doc_type":"usermanual", - "p_code":"113", - "code":"116" + "p_code":"118", + "code":"121" }, { "desc":"If the source link of a job is a Hive link, configure the source job parameters based on Table 1.If the data source is Hive, CDM will automatically partition data using t", @@ -1049,17 +1094,17 @@ "title":"From Hive", "uri":"dataartsstudio_01_0051.html", "doc_type":"usermanual", - "p_code":"113", - "code":"117" + "p_code":"118", + "code":"122" }, { "desc":"If the source link of a job is a DLI link, configure the source job parameters based on Table 1.", "product_code":"dataartsstudio", "title":"From DLI", - "uri":"dataartsstudio_01_0120_0.html", + "uri":"dataartsstudio_01_0120.html", "doc_type":"usermanual", - "p_code":"113", - "code":"118" + "p_code":"118", + "code":"123" }, { "desc":"If the source link of a job is an FTP or SFTP link, configure the source job parameters based on Table 1.Advanced attributes are optional and not displayed by default. Yo", @@ -1067,8 +1112,8 @@ "title":"From FTP/SFTP", "uri":"dataartsstudio_01_0052.html", "doc_type":"usermanual", - "p_code":"113", - "code":"119" + "p_code":"118", + "code":"124" }, { "desc":"If the source link of a job is an HTTP link, configure the source job parameters based on Table 1. Currently, data can only be exported from the HTTP URLs.", @@ -1076,8 +1121,8 @@ "title":"From HTTP", "uri":"dataartsstudio_01_0053.html", "doc_type":"usermanual", - "p_code":"113", - "code":"120" + "p_code":"118", + "code":"125" }, { "desc":"If the source link of a job is an RDS for PostgreSQL, RDS for SQL Server, PostgreSQL, or Microsoft SQL Server link, configure the source job parameters based on Table 1.", @@ -1085,8 +1130,8 @@ "title":"From PostgreSQL/SQL Server", "uri":"dataartsstudio_01_0054.html", "doc_type":"usermanual", - "p_code":"113", - "code":"121" + "p_code":"118", + "code":"126" }, { "desc":"If the source link of a job is a DWS link, configure the source job parameters based on Table 1.", @@ -1094,8 +1139,8 @@ "title":"From DWS", "uri":"dataartsstudio_01_0387.html", "doc_type":"usermanual", - "p_code":"113", - "code":"122" + "p_code":"118", + "code":"127" }, { "desc":"Table 1 lists the job parameters when the source link is a SAP HANA link.", @@ -1103,8 +1148,8 @@ "title":"From SAP HANA", "uri":"dataartsstudio_01_0388.html", "doc_type":"usermanual", - "p_code":"113", - "code":"123" + "p_code":"118", + "code":"128" }, { "desc":"If the source link of a job is an RDS for MySQL or MySQL link, configure the source job parameters based on Table 1.", @@ -1112,8 +1157,8 @@ "title":"From MySQL", "uri":"dataartsstudio_01_1254.html", "doc_type":"usermanual", - "p_code":"113", - "code":"124" + "p_code":"118", + "code":"129" }, { "desc":"If the source link of a job is an Oracle link, configure the source job parameters based on Table 1.When an Oracle database is the migration source, if Partitioning Field", @@ -1121,8 +1166,8 @@ "title":"From Oracle", "uri":"dataartsstudio_01_1255.html", "doc_type":"usermanual", - "p_code":"113", - "code":"125" + "p_code":"118", + "code":"130" }, { "desc":"If the source link of a job is a database shard link, configure the source job parameters based on Table 1.If the Source Link Name is the backend link of the sharded link", @@ -1130,8 +1175,8 @@ "title":"From a Database Shard", "uri":"dataartsstudio_01_1256.html", "doc_type":"usermanual", - "p_code":"113", - "code":"126" + "p_code":"118", + "code":"131" }, { "desc":"When you migrate MongoDB or DDS data, CDM reads the first row of the collection as an example of the field list. If the first row of data does not contain all fields of t", @@ -1139,8 +1184,8 @@ "title":"From MongoDB/DDS", "uri":"dataartsstudio_01_0055.html", "doc_type":"usermanual", - "p_code":"113", - "code":"127" + "p_code":"118", + "code":"132" }, { "desc":"The Redis service of the third-party cloud cannot serve as the migration source. However, the Redis set up in the on-premises data center or on the ECS can be the migrati", @@ -1148,8 +1193,8 @@ "title":"From Redis", "uri":"dataartsstudio_01_0056.html", "doc_type":"usermanual", - "p_code":"113", - "code":"128" + "p_code":"118", + "code":"133" }, { "desc":"If the source link of a job is a Kafka link or DMS Kafka link, configure the source job parameters based on Table 1.", @@ -1157,17 +1202,17 @@ "title":"From Kafka/DMS Kafka", "uri":"dataartsstudio_01_0058.html", "doc_type":"usermanual", - "p_code":"113", - "code":"129" + "p_code":"118", + "code":"134" }, { - "desc":"If the source link of a job is a link described in Link to Elasticsearch or Link to CSS, configure the source job parameters based on Table 1.", + "desc":"If the source link of a job is a link described in Elasticsearch Link Parameters or CSS Link Parameters, configure the source job parameters based on Table 1.", "product_code":"dataartsstudio", "title":"From Elasticsearch or CSS", "uri":"dataartsstudio_01_0059.html", "doc_type":"usermanual", - "p_code":"113", - "code":"130" + "p_code":"118", + "code":"135" }, { "desc":"If the source link of a job is a CloudTable OpenTSDB link, configure the source job parameters based on Table 1.", @@ -1175,8 +1220,8 @@ "title":"From OpenTSDB", "uri":"dataartsstudio_01_0060.html", "doc_type":"usermanual", - "p_code":"113", - "code":"131" + "p_code":"118", + "code":"136" }, { "desc":"If the source link of a job is an MRS Hudi link, configure the source job parameters based on Table 1.", @@ -1184,8 +1229,8 @@ "title":"From MRS Hudi", "uri":"dataartsstudio_01_0185.html", "doc_type":"usermanual", - "p_code":"113", - "code":"132" + "p_code":"118", + "code":"137" }, { "desc":"If the source link of a job is an MRS ClickHouse link, configure the source job parameters based on Table 1.", @@ -1193,8 +1238,17 @@ "title":"From MRS ClickHouse", "uri":"dataartsstudio_01_0286.html", "doc_type":"usermanual", - "p_code":"113", - "code":"133" + "p_code":"118", + "code":"138" + }, + { + "desc":"If the source link of a job is a LogHub (SLS) link, configure the source job parameters based on Table 1.", + "product_code":"dataartsstudio", + "title":"From LogHub (SLS)", + "uri":"dataartsstudio_01_0289.html", + "doc_type":"usermanual", + "p_code":"118", + "code":"139" }, { "desc":"If the source link of a job is a ShenTong database link, configure the source job parameters based on Table 1.", @@ -1202,26 +1256,26 @@ "title":"From a ShenTong Database", "uri":"dataartsstudio_01_0291.html", "doc_type":"usermanual", - "p_code":"113", - "code":"134" + "p_code":"118", + "code":"140" }, { - "desc":"If the source link of a job is a Doris link, configure the source job parameters based on Table 1.", + "desc":"If the source link of a job is a YASHAN link, configure the source job parameters based on Table 1.", "product_code":"dataartsstudio", - "title":"From Doris", - "uri":"dataartsstudio_01_0136.html", + "title":"From YASHAN", + "uri":"dataartsstudio_01_1629.html", "doc_type":"usermanual", - "p_code":"113", - "code":"135" + "p_code":"118", + "code":"141" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Destination Job Parameters", + "title":"Configuring CDM Destination Job Parameters", "uri":"dataartsstudio_01_0061.html", "doc_type":"usermanual", - "p_code":"110", - "code":"136" + "p_code":"115", + "code":"142" }, { "desc":"If the destination link of a job is an OBS link, that is, data is to be imported to OBS, configure the destination job parameters based on Table 1.Advanced attributes are", @@ -1229,8 +1283,8 @@ "title":"To OBS", "uri":"dataartsstudio_01_0062.html", "doc_type":"usermanual", - "p_code":"136", - "code":"137" + "p_code":"142", + "code":"143" }, { "desc":"If the destination link of a job is an HDFS link, configure the destination job parameters based on Table 1.HDFS supports the UTF-8 encoding only. Retain the default valu", @@ -1238,8 +1292,8 @@ "title":"To HDFS", "uri":"dataartsstudio_01_0063.html", "doc_type":"usermanual", - "p_code":"136", - "code":"138" + "p_code":"142", + "code":"144" }, { "desc":"If the destination link of a job is an HBase link or CloudTable link, configure the destination job parameters based on Table 1.", @@ -1247,17 +1301,17 @@ "title":"To HBase/CloudTable", "uri":"dataartsstudio_01_0064.html", "doc_type":"usermanual", - "p_code":"136", - "code":"139" + "p_code":"142", + "code":"145" }, { - "desc":"If the destination link of a job is a Hive link, configure the destination job parameters based on Table 1.When Hive serves as the destination end, a table whose storage ", + "desc":"If the destination link of a job is a Hive link, configure the destination job parameters based on Table 1.If the source Hive contains both the array and map types of dat", "product_code":"dataartsstudio", "title":"To Hive", "uri":"dataartsstudio_01_0066.html", "doc_type":"usermanual", - "p_code":"136", - "code":"140" + "p_code":"142", + "code":"146" }, { "desc":"Table 1 lists the destination job parameters when the destination link is an MySQL, SQL Server, or PostgreSQL link.", @@ -1265,8 +1319,8 @@ "title":"To MySQL/SQL Server/PostgreSQL", "uri":"dataartsstudio_01_0068.html", "doc_type":"usermanual", - "p_code":"136", - "code":"141" + "p_code":"142", + "code":"147" }, { "desc":"If the destination link of a job is an Oracle database link, configure the destination job parameters based on Table 1.", @@ -1274,8 +1328,8 @@ "title":"To Oracle", "uri":"dataartsstudio_01_0252.html", "doc_type":"usermanual", - "p_code":"136", - "code":"142" + "p_code":"142", + "code":"148" }, { "desc":"If the destination link of a job is a DWS link, configure the destination job parameters based on Table 1.Figure 1 describes the field mapping between DWS tables created ", @@ -1283,8 +1337,8 @@ "title":"To DWS", "uri":"dataartsstudio_01_1251.html", "doc_type":"usermanual", - "p_code":"136", - "code":"143" + "p_code":"142", + "code":"149" }, { "desc":"If the destination link of a job is a DDS link, configure the destination job parameters based on Table 1.Parameter descriptionParameterDescriptionExample ValueDatabase N", @@ -1292,8 +1346,8 @@ "title":"To DDS", "uri":"dataartsstudio_01_0069.html", "doc_type":"usermanual", - "p_code":"136", - "code":"144" + "p_code":"142", + "code":"150" }, { "desc":"Table 1 lists the destination job parameters when the destination link is a Redis link.Parameter descriptionParameterDescriptionExample ValueRedis Key PrefixKey prefix, w", @@ -1301,26 +1355,26 @@ "title":"To Redis", "uri":"dataartsstudio_01_0070.html", "doc_type":"usermanual", - "p_code":"136", - "code":"145" + "p_code":"142", + "code":"151" }, { - "desc":"If the destination link of a job is a link described in Link to Elasticsearch or Link to CSS, configure the destination job parameters based on Table 1.", + "desc":"If the destination link of a job is a link described in Elasticsearch Link Parameters or CSS Link Parameters, configure the destination job parameters based on Table 1.Th", "product_code":"dataartsstudio", "title":"To Elasticsearch/CSS", "uri":"dataartsstudio_01_0071.html", "doc_type":"usermanual", - "p_code":"136", - "code":"146" + "p_code":"142", + "code":"152" }, { - "desc":"If the destination link of a job is a DLI link, configure the destination job parameters based on Table 1.When you use CDM to migrate data to DLI, DLI generates data file", + "desc":"If the destination link of a job is a DLI link, configure the destination job parameters based on Table 1.When data is migrated to DLI using CDM, DLI generates data files", "product_code":"dataartsstudio", "title":"To DLI", "uri":"dataartsstudio_01_0072.html", "doc_type":"usermanual", - "p_code":"136", - "code":"147" + "p_code":"142", + "code":"153" }, { "desc":"If the destination link of a job is a CloudTable OpenTSDB link, configure the destination job parameters based on Table 1.", @@ -1328,8 +1382,8 @@ "title":"To OpenTSDB", "uri":"dataartsstudio_01_0074.html", "doc_type":"usermanual", - "p_code":"136", - "code":"148" + "p_code":"142", + "code":"154" }, { "desc":"If the destination link of a job is an MRS Hudi link, configure the destination job parameters based on Table 1.", @@ -1337,8 +1391,8 @@ "title":"To MRS Hudi", "uri":"dataartsstudio_01_0186.html", "doc_type":"usermanual", - "p_code":"136", - "code":"149" + "p_code":"142", + "code":"155" }, { "desc":"If the destination link of a job is an MRS ClickHouse link, configure the destination job parameters based on Table 1.If the source link of the job is an MRS ClickHouse, ", @@ -1346,8 +1400,8 @@ "title":"To MRS ClickHouse", "uri":"dataartsstudio_01_0287.html", "doc_type":"usermanual", - "p_code":"136", - "code":"150" + "p_code":"142", + "code":"156" }, { "desc":"If the destination link of a job is a MongoDB link, configure the destination job parameters based on Table 1.", @@ -1355,197 +1409,188 @@ "title":"To MongoDB", "uri":"dataartsstudio_01_0332.html", "doc_type":"usermanual", - "p_code":"136", - "code":"151" - }, - { - "desc":"Table 1 lists the destination job parameters when the destination link is a Doris link.", - "product_code":"dataartsstudio", - "title":"To Doris", - "uri":"dataartsstudio_01_0999.html", - "doc_type":"usermanual", - "p_code":"136", - "code":"152" + "p_code":"142", + "code":"157" }, { "desc":"After the job parameters are configured, you can configure field mapping. You can click on the Map Field page to customize new fields or click in the Operation column t", "product_code":"dataartsstudio", - "title":"Configuring Field Mapping", + "title":"Configuring CDM Job Field Mapping", "uri":"dataartsstudio_01_0261.html", "doc_type":"usermanual", - "p_code":"110", - "code":"153" + "p_code":"115", + "code":"158" }, { "desc":"CDM supports scheduled execution of table/file migration jobs by minute, hour, day, week, and month. This section describes how to configure scheduled job parameters.When", "product_code":"dataartsstudio", - "title":"Scheduling Job Execution", + "title":"Configuring a Scheduled CDM Job", "uri":"dataartsstudio_01_0082.html", "doc_type":"usermanual", - "p_code":"110", - "code":"154" + "p_code":"115", + "code":"159" }, { "desc":"On the Settings tab page, you can perform the following operations:Maximum Concurrent ExtractorsScheduled Backup/RestorationEnvironment Variables of Job ParametersMaximum", "product_code":"dataartsstudio", - "title":"Job Configuration Management", + "title":"Managing CDM Job Configuration", "uri":"dataartsstudio_01_0083.html", "doc_type":"usermanual", - "p_code":"110", - "code":"155" + "p_code":"115", + "code":"160" }, { "desc":"Existing CDM jobs can be viewed, modified, deleted, started, and stopped. This section describes how to view and modify a job.Viewing job statusThe job status can be New,", "product_code":"dataartsstudio", - "title":"Managing a Single Job", + "title":"Managing a CDM Job", "uri":"dataartsstudio_01_0084.html", "doc_type":"usermanual", - "p_code":"110", - "code":"156" - }, - { - "desc":"This section describes how to manage CDM table/file migration jobs in batches. The following operations are involved:Manage jobs by group.Run jobs in batches.Delete jobs ", - "product_code":"dataartsstudio", - "title":"Managing Jobs in Batches", - "uri":"dataartsstudio_01_0085.html", - "doc_type":"usermanual", - "p_code":"110", - "code":"157" - }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"Improving Migration Performance", - "uri":"dataartsstudio_01_0018.html", - "doc_type":"usermanual", - "p_code":"59", - "code":"158" - }, - { - "desc":"Figure 1 shows the simplified migration model used by CDM.CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submit", - "product_code":"dataartsstudio", - "title":"How Migration Jobs Work", - "uri":"dataartsstudio_01_0025.html", - "doc_type":"usermanual", - "p_code":"158", - "code":"159" - }, - { - "desc":"In addition to increasing the source read speed, improving the destination write performance, and increasing the bandwidth, you can accelerate migration using the followi", - "product_code":"dataartsstudio", - "title":"Performance Tuning", - "uri":"dataartsstudio_01_0076.html", - "doc_type":"usermanual", - "p_code":"158", - "code":"160" - }, - { - "desc":"CDM splits jobs for different data sources based on different dimensions. Table 1 lists the splitting dimensions.", - "product_code":"dataartsstudio", - "title":"Reference: Job Splitting Dimensions", - "uri":"dataartsstudio_01_0078.html", - "doc_type":"usermanual", - "p_code":"158", + "p_code":"115", "code":"161" }, { - "desc":"The performance metrics provided in this document are for reference only. The performance at your site may be affected by factors such as the data source performance at t", + "desc":"This section describes how to manage CDM table/file migration jobs in batches. The following operations are supported:Managing jobs by groupRunning jobs in batchesDeletin", "product_code":"dataartsstudio", - "title":"Reference: CDM Performance Test Data", - "uri":"dataartsstudio_01_0077.html", + "title":"Managing CDM Jobs", + "uri":"dataartsstudio_01_0085.html", "doc_type":"usermanual", - "p_code":"158", + "p_code":"115", "code":"162" }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"Key Operation Guide", - "uri":"dataartsstudio_01_0110.html", - "doc_type":"usermanual", - "p_code":"59", - "code":"163" - }, - { - "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", - "product_code":"dataartsstudio", - "title":"Incremental Migration", - "uri":"dataartsstudio_01_0111.html", - "doc_type":"usermanual", - "p_code":"163", - "code":"164" - }, - { - "desc":"CDM supports incremental migration of file systems. After full migration is complete, all new files or only specified directories or files can be exported.Currently, CDM ", - "product_code":"dataartsstudio", - "title":"Incremental File Migration", - "uri":"dataartsstudio_01_0112.html", - "doc_type":"usermanual", - "p_code":"164", - "code":"165" - }, - { - "desc":"CDM supports incremental migration of relational databases. After a full migration is complete, data in a specified period can be incrementally migrated. For example, dat", - "product_code":"dataartsstudio", - "title":"Incremental Migration of Relational Databases", - "uri":"dataartsstudio_01_0113.html", - "doc_type":"usermanual", - "p_code":"164", - "code":"166" - }, - { - "desc":"You can use CDM to export data in a specified period of time from HBase (including MRS HBase, FusionInsight HBase, and Apache HBase) and CloudTable. The CDM scheduled job", - "product_code":"dataartsstudio", - "title":"HBase/CloudTable Incremental Migration", - "uri":"dataartsstudio_01_0115_0.html", - "doc_type":"usermanual", - "p_code":"164", - "code":"167" - }, - { - "desc":"By using CDM, you can export MongoDB or DDS data within a specified period. With the scheduled jobs of CDM, you can implement incremental migration of MongoDB and DDS.If ", - "product_code":"dataartsstudio", - "title":"MongoDB/DDS Incremental Migration", - "uri":"dataartsstudio_01_0125.html", - "doc_type":"usermanual", - "p_code":"164", - "code":"168" - }, { "desc":"During the creation of table/file migration jobs, CDM supports the macro variables of date and time in the following parameters of the source and destination links:Source", "product_code":"dataartsstudio", "title":"Using Macro Variables of Date and Time", "uri":"dataartsstudio_01_0114.html", "doc_type":"usermanual", - "p_code":"163", + "p_code":"64", + "code":"163" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Improving Migration Performance", + "uri":"dataartsstudio_01_0018.html", + "doc_type":"usermanual", + "p_code":"64", + "code":"164" + }, + { + "desc":"Figure 1 shows the simplified migration model used by CDM.CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submit", + "product_code":"dataartsstudio", + "title":"How Migration Jobs Work", + "uri":"dataartsstudio_01_0025.html", + "doc_type":"usermanual", + "p_code":"164", + "code":"165" + }, + { + "desc":"In addition to increasing the source read speed, improving the destination write performance, and increasing the bandwidth, you can accelerate migration using the followi", + "product_code":"dataartsstudio", + "title":"Performance Tuning", + "uri":"dataartsstudio_01_0076.html", + "doc_type":"usermanual", + "p_code":"164", + "code":"166" + }, + { + "desc":"CDM splits jobs for different data sources based on different dimensions. Table 1 lists the splitting dimensions.", + "product_code":"dataartsstudio", + "title":"Reference: Job Splitting Dimensions", + "uri":"dataartsstudio_01_0078.html", + "doc_type":"usermanual", + "p_code":"164", + "code":"167" + }, + { + "desc":"The performance metrics provided in this document are for reference only. The performance at your site may be affected by factors such as the data source performance at t", + "product_code":"dataartsstudio", + "title":"Reference: CDM Performance Test Data", + "uri":"dataartsstudio_01_0077.html", + "doc_type":"usermanual", + "p_code":"164", + "code":"168" + }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Key Operation Guide", + "uri":"dataartsstudio_01_0110.html", + "doc_type":"usermanual", + "p_code":"64", "code":"169" }, + { + "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", + "product_code":"dataartsstudio", + "title":"Incremental Migration", + "uri":"dataartsstudio_01_0111.html", + "doc_type":"usermanual", + "p_code":"169", + "code":"170" + }, + { + "desc":"CDM supports incremental migration of file systems. After full migration is complete, all new files or only specified directories or files can be exported.Currently, CDM ", + "product_code":"dataartsstudio", + "title":"Incremental File Migration", + "uri":"dataartsstudio_01_0112.html", + "doc_type":"usermanual", + "p_code":"170", + "code":"171" + }, + { + "desc":"CDM supports incremental migration of relational databases. After a full migration is complete, data in a specified period can be incrementally migrated. For example, dat", + "product_code":"dataartsstudio", + "title":"Incremental Migration of Relational Databases", + "uri":"dataartsstudio_01_0113.html", + "doc_type":"usermanual", + "p_code":"170", + "code":"172" + }, + { + "desc":"You can use CDM to export data in a specified period of time from HBase (including MRS HBase, FusionInsight HBase, and Apache HBase) and CloudTable. The CDM scheduled job", + "product_code":"dataartsstudio", + "title":"HBase/CloudTable Incremental Migration", + "uri":"dataartsstudio_01_0137.html", + "doc_type":"usermanual", + "p_code":"170", + "code":"173" + }, + { + "desc":"By using CDM, you can export MongoDB or DDS data within a specified period. With the scheduled jobs of CDM, you can implement incremental migration of MongoDB and DDS.If ", + "product_code":"dataartsstudio", + "title":"MongoDB/DDS Incremental Migration", + "uri":"dataartsstudio_01_0125.html", + "doc_type":"usermanual", + "p_code":"170", + "code":"174" + }, { "desc":"When a CDM job fails to be executed, CDM rolls back the data to the state before the job starts and automatically deletes data from the destination table.Parameter positi", "product_code":"dataartsstudio", "title":"Migration in Transaction Mode", - "uri":"dataartsstudio_01_0116_0.html", + "uri":"dataartsstudio_01_0589.html", "doc_type":"usermanual", - "p_code":"163", - "code":"170" + "p_code":"169", + "code":"175" }, { "desc":"When you migrate files to a file system, CDM can encrypt and decrypt those files. Currently, CDM supports the following encryption modes:AES-256-GCMKMS EncryptionAES-256-", "product_code":"dataartsstudio", "title":"Encryption and Decryption During File Migration", - "uri":"dataartsstudio_01_0117_0.html", + "uri":"dataartsstudio_01_0590.html", "doc_type":"usermanual", - "p_code":"163", - "code":"171" + "p_code":"169", + "code":"176" }, { "desc":"CDM extracts data from the migration source and writes the data to the migration destination. Figure 1 shows the migration mode when files are migrated to OBS.During the ", "product_code":"dataartsstudio", "title":"MD5 Verification", - "uri":"dataartsstudio_01_0118_0.html", + "uri":"dataartsstudio_01_0591.html", "doc_type":"usermanual", - "p_code":"163", - "code":"172" + "p_code":"169", + "code":"177" }, { "desc":"After the job parameters are configured, field mapping needs to be configured. You can click in the Operation column to create a field converter.If files are migrated be", @@ -1553,8 +1598,8 @@ "title":"Configuring Field Converters", "uri":"dataartsstudio_01_0104.html", "doc_type":"usermanual", - "p_code":"163", - "code":"173" + "p_code":"169", + "code":"178" }, { "desc":"After job parameters are configured, field mapping needs to be configured. You can customize new fields by clicking on the Map Field page.If files are migrated between F", @@ -1562,26 +1607,26 @@ "title":"Adding Fields", "uri":"dataartsstudio_01_0304.html", "doc_type":"usermanual", - "p_code":"163", - "code":"174" + "p_code":"169", + "code":"179" }, { "desc":"You can migrate files (a maximum of 50) with specified names from FTP, OBS, or SFTP at a time. The exported files can only be written to the same directory on the migrati", "product_code":"dataartsstudio", "title":"Migrating Files with Specified Names", - "uri":"dataartsstudio_01_0105.html", + "uri":"dataartsstudio_01_0592.html", "doc_type":"usermanual", - "p_code":"163", - "code":"175" + "p_code":"169", + "code":"180" }, { "desc":"During table/file migration, CDM uses delimiters to separate fields in CSV files. However, delimiters cannot be used in complex semi-structured data because the field val", "product_code":"dataartsstudio", "title":"Regular Expressions for Separating Semi-structured Text", - "uri":"dataartsstudio_01_0106.html", + "uri":"dataartsstudio_01_0593.html", "doc_type":"usermanual", - "p_code":"163", - "code":"176" + "p_code":"169", + "code":"181" }, { "desc":"When you create a job on the CDM console to migrate tables or files of a relational database, you can add a field to record the time when they were written to the databas", @@ -1589,8 +1634,8 @@ "title":"Recording the Time When Data Is Written to the Database", "uri":"dataartsstudio_01_0109.html", "doc_type":"usermanual", - "p_code":"163", - "code":"177" + "p_code":"169", + "code":"182" }, { "desc":"When creating a CDM job, you need to specify File Format in the job parameters of the migration source and destination in some scenarios. This section describes the appli", @@ -1598,8 +1643,8 @@ "title":"File Formats", "uri":"dataartsstudio_01_0108.html", "doc_type":"usermanual", - "p_code":"163", - "code":"178" + "p_code":"169", + "code":"183" }, { "desc":"When field mapping is configured on CDM, a message is displayed indicating that the data type of the field is not supported and the field needs to be deleted. If you need", @@ -1607,17 +1652,17 @@ "title":"Converting Unsupported Data Types", "uri":"dataartsstudio_01_0209.html", "doc_type":"usermanual", - "p_code":"163", - "code":"179" + "p_code":"169", + "code":"184" }, { - "desc":"Figure 1 describes the field mapping between the DWS tables created by CDM and source tables. For example, if you use CDM to migrate the Oracle database to DWS, CDM autom", + "desc":"CDM converts the field type of the source to the field type of the destination based on the default rule and creates a table at the destination.Figure 1 describes the fie", "product_code":"dataartsstudio", "title":"Auto Table Creation", "uri":"dataartsstudio_01_2000.html", "doc_type":"usermanual", - "p_code":"163", - "code":"180" + "p_code":"169", + "code":"185" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1625,8 +1670,8 @@ "title":"Tutorials", "uri":"dataartsstudio_01_0086.html", "doc_type":"usermanual", - "p_code":"59", - "code":"181" + "p_code":"64", + "code":"186" }, { "desc":"MRS Hive links are applicable to the MapReduce Service (MRS). This tutorial describes how to create an MRS Hive link.You have created a CDM cluster.You have obtained the ", @@ -1634,8 +1679,8 @@ "title":"Creating an MRS Hive Link", "uri":"dataartsstudio_01_0130.html", "doc_type":"usermanual", - "p_code":"181", - "code":"182" + "p_code":"186", + "code":"187" }, { "desc":"MySQL links are applicable to third-party cloud MySQL services and MySQL created in a local data center or ECS. This tutorial describes how to create a MySQL link.You hav", @@ -1643,8 +1688,8 @@ "title":"Creating a MySQL Link", "uri":"dataartsstudio_01_0131.html", "doc_type":"usermanual", - "p_code":"181", - "code":"183" + "p_code":"186", + "code":"188" }, { "desc":"MRS provides enterprise-level big data clusters on the cloud. It contains HDFS, Hive, and Spark components and is applicable to massive data analysis of enterprises.Hive ", @@ -1652,8 +1697,8 @@ "title":"Migrating Data from MySQL to MRS Hive", "uri":"dataartsstudio_01_0092.html", "doc_type":"usermanual", - "p_code":"181", - "code":"184" + "p_code":"186", + "code":"189" }, { "desc":"CDM supports table-to-OBS data migration. This section describes how to migrate tables from a MySQL database to OBS. The process is as follows:Creating a CDM Cluster and ", @@ -1661,8 +1706,8 @@ "title":"Migrating Data from MySQL to OBS", "uri":"dataartsstudio_01_0100.html", "doc_type":"usermanual", - "p_code":"181", - "code":"185" + "p_code":"186", + "code":"190" }, { "desc":"CDM supports table-to-table data migration. This section describes how to migrate data from MySQL to DWS. The process is as follows:Creating a CDM Cluster and Binding an ", @@ -1670,8 +1715,8 @@ "title":"Migrating Data from MySQL to DWS", "uri":"dataartsstudio_01_0101.html", "doc_type":"usermanual", - "p_code":"181", - "code":"186" + "p_code":"186", + "code":"191" }, { "desc":"This section describes how to migrate the entire on-premises MySQL database to RDS using the CDM's entire DB migration function.Currently, CDM can migrate the entire on-p", @@ -1679,8 +1724,8 @@ "title":"Migrating an Entire MySQL Database to RDS", "uri":"dataartsstudio_01_0098.html", "doc_type":"usermanual", - "p_code":"181", - "code":"187" + "p_code":"186", + "code":"192" }, { "desc":"Cloud Search Service provides users with structured and unstructured data search, statistics, and report capabilities. This section describes how to use CDM to migrate da", @@ -1688,8 +1733,8 @@ "title":"Migrating Data from Oracle to CSS", "uri":"dataartsstudio_01_0091.html", "doc_type":"usermanual", - "p_code":"181", - "code":"188" + "p_code":"186", + "code":"193" }, { "desc":"CDM supports table-to-table migration. This section describes how to use CDM to migrate data from Oracle to Data Warehouse Service (DWS). The procedure is as follows:Crea", @@ -1697,8 +1742,8 @@ "title":"Migrating Data from Oracle to DWS", "uri":"dataartsstudio_01_0133.html", "doc_type":"usermanual", - "p_code":"181", - "code":"189" + "p_code":"186", + "code":"194" }, { "desc":"CDM supports data migration between cloud services. This section describes how to use CDM to migrate data from OBS to CSS. The procedure is as follows:Creating a CDM Clus", @@ -1706,8 +1751,8 @@ "title":"Migrating Data from OBS to CSS", "uri":"dataartsstudio_01_0088.html", "doc_type":"usermanual", - "p_code":"181", - "code":"190" + "p_code":"186", + "code":"195" }, { "desc":"DLI is a fully hosted big data query service. This section describes how to use CDM to migrate data from OBS to DLI. The procedure includes four steps:Creating a CDM Clus", @@ -1715,8 +1760,8 @@ "title":"Migrating Data from OBS to DLI", "uri":"dataartsstudio_01_0089.html", "doc_type":"usermanual", - "p_code":"181", - "code":"191" + "p_code":"186", + "code":"196" }, { "desc":"CDM supports file-to-file data migration. This section describes how to migrate data from MRS HDFS to OBS. The process is as follows:Creating a CDM Cluster and Binding an", @@ -1724,8 +1769,8 @@ "title":"Migrating Data from MRS HDFS to OBS", "uri":"dataartsstudio_01_0103.html", "doc_type":"usermanual", - "p_code":"181", - "code":"192" + "p_code":"186", + "code":"197" }, { "desc":"CSS provides users with structured and unstructured data search, statistics, and report capabilities. This section describes how to use CDM to migrate the entire Elastics", @@ -1733,8 +1778,8 @@ "title":"Migrating the Entire Elasticsearch Database to CSS", "uri":"dataartsstudio_01_0099.html", "doc_type":"usermanual", - "p_code":"181", - "code":"193" + "p_code":"186", + "code":"198" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1742,8 +1787,8 @@ "title":"DataArts Factory", "uri":"dataartsstudio_01_0400.html", "doc_type":"usermanual", - "p_code":"25", - "code":"194" + "p_code":"11", + "code":"199" }, { "desc":"DataArts Factory is a one-stop big data collaborative development platform that provides fully managed big data scheduling capabilities. It manages various big data servi", @@ -1751,8 +1796,8 @@ "title":"Overview", "uri":"dataartsstudio_01_0401.html", "doc_type":"usermanual", - "p_code":"194", - "code":"195" + "p_code":"199", + "code":"200" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1760,8 +1805,8 @@ "title":"Data Management", "uri":"dataartsstudio_01_0403.html", "doc_type":"usermanual", - "p_code":"194", - "code":"196" + "p_code":"199", + "code":"201" }, { "desc":"The data management function helps you quickly establish data models and provides you with data entities for script and job development. With data management, you can:Man", @@ -1769,17 +1814,17 @@ "title":"Data Management Process", "uri":"dataartsstudio_01_0402.html", "doc_type":"usermanual", - "p_code":"196", - "code":"197" + "p_code":"201", + "code":"202" }, { - "desc":"After a data connection is created, you can perform data operations on DataArts Factory, for example, managing databases, namespaces, database schema, and tables.With one", + "desc":"After creating a data connection, you can perform data operations on DataArts Factory, for example, managing databases, namespaces, database schema, and tables.With one d", "product_code":"dataartsstudio", "title":"Creating a Data Connection", "uri":"dataartsstudio_01_0404.html", "doc_type":"usermanual", - "p_code":"196", - "code":"198" + "p_code":"201", + "code":"203" }, { "desc":"After creating a data connection, you can create a database on the console or using a SQL script.(Recommended) Console: You can directly create a database on the DataArts", @@ -1787,17 +1832,17 @@ "title":"Creating a Database", "uri":"dataartsstudio_01_0405.html", "doc_type":"usermanual", - "p_code":"196", - "code":"199" + "p_code":"201", + "code":"204" }, { - "desc":"After creating a DWS data connection, you can manage the database schemas under the DWS data connection.A DWS data connection has been created. For details, see Creating ", + "desc":"After creating a DWS data connection, you can manage the database schemas under the DWS data connection.If existing database schemas meet your requirements, skip this sec", "product_code":"dataartsstudio", "title":"(Optional) Creating a Database Schema", "uri":"dataartsstudio_01_0412.html", "doc_type":"usermanual", - "p_code":"196", - "code":"200" + "p_code":"201", + "code":"205" }, { "desc":"You can create a table on the DataArts Factory console, in DDL mode, or using a SQL script.(Recommended) Console: You can directly create a table on the DataArts Studio D", @@ -1805,8 +1850,8 @@ "title":"Creating a Table", "uri":"dataartsstudio_01_0416.html", "doc_type":"usermanual", - "p_code":"196", - "code":"201" + "p_code":"201", + "code":"206" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1814,8 +1859,8 @@ "title":"Script Development", "uri":"dataartsstudio_01_0421.html", "doc_type":"usermanual", - "p_code":"194", - "code":"202" + "p_code":"199", + "code":"207" }, { "desc":"The script development function provides the following capabilities:Provides an online script editor for developing and debugging SQL, Python, and Shell scripts.Supports ", @@ -1823,8 +1868,8 @@ "title":"Script Development Process", "uri":"dataartsstudio_01_0422.html", "doc_type":"usermanual", - "p_code":"202", - "code":"203" + "p_code":"207", + "code":"208" }, { "desc":"DataArts Factory allows you to create, edit, debug, and run SQL, Python, and Shell scripts. Before developing a script, you must create one.You have completed operations ", @@ -1832,8 +1877,8 @@ "title":"Creating a Script", "uri":"dataartsstudio_01_0423.html", "doc_type":"usermanual", - "p_code":"202", - "code":"204" + "p_code":"207", + "code":"209" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1841,8 +1886,8 @@ "title":"Developing Scripts", "uri":"dataartsstudio_01_0406.html", "doc_type":"usermanual", - "p_code":"202", - "code":"205" + "p_code":"207", + "code":"210" }, { "desc":"DataArts Factory allows you to develop, debug, and run SQL scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.DataArts Fact", @@ -1850,8 +1895,8 @@ "title":"Developing an SQL Script", "uri":"dataartsstudio_01_0424.html", "doc_type":"usermanual", - "p_code":"205", - "code":"206" + "p_code":"210", + "code":"211" }, { "desc":"DataArts Factory allows you to develop, debug, and run Shell scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.A shell scr", @@ -1859,8 +1904,8 @@ "title":"Developing a Shell Script", "uri":"dataartsstudio_01_0425.html", "doc_type":"usermanual", - "p_code":"205", - "code":"207" + "p_code":"210", + "code":"212" }, { "desc":"DataArts Factory allows you to develop, debug, and run Python scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.For detail", @@ -1868,8 +1913,8 @@ "title":"Developing a Python Script", "uri":"dataartsstudio_01_4503.html", "doc_type":"usermanual", - "p_code":"205", - "code":"208" + "p_code":"210", + "code":"213" }, { "desc":"Submitting a version depends on the version management function of DataArts Factory.Version management traces script and job changes, and supports version comparison and ", @@ -1877,8 +1922,8 @@ "title":"Submitting a Version", "uri":"dataartsstudio_01_0901.html", "doc_type":"usermanual", - "p_code":"202", - "code":"209" + "p_code":"207", + "code":"214" }, { "desc":"In enterprise mode, when a developer submits a script version, the system generates a script release task. After the developer confirms releasing a package and the admin,", @@ -1886,8 +1931,8 @@ "title":"Releasing a Script Task", "uri":"dataartsstudio_01_1902.html", "doc_type":"usermanual", - "p_code":"202", - "code":"210" + "p_code":"207", + "code":"215" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1895,8 +1940,8 @@ "title":"(Optional) Managing Scripts", "uri":"dataartsstudio_01_0407.html", "doc_type":"usermanual", - "p_code":"202", - "code":"211" + "p_code":"207", + "code":"216" }, { "desc":"This section describes how to copy a script.A script has been developed based on Developing Scripts.Log in to the DataArts Studio console by following the instructions in", @@ -1904,8 +1949,8 @@ "title":"Copying a Script", "uri":"dataartsstudio_01_0430.html", "doc_type":"usermanual", - "p_code":"211", - "code":"212" + "p_code":"216", + "code":"217" }, { "desc":"You can copy the name of a script and rename a script.A script has been developed based on Developing Scripts.Log in to the DataArts Studio console by following the instr", @@ -1913,8 +1958,8 @@ "title":"Copying the Script Name and Renaming a Script", "uri":"dataartsstudio_01_0426.html", "doc_type":"usermanual", - "p_code":"211", - "code":"213" + "p_code":"216", + "code":"218" }, { "desc":"You can move a script file from one directory to another or move a script directory to another directory.A script has been developed based on Developing Scripts.Log in to", @@ -1922,8 +1967,8 @@ "title":"Moving a Script or Script Directory", "uri":"dataartsstudio_01_0427.html", "doc_type":"usermanual", - "p_code":"211", - "code":"214" + "p_code":"216", + "code":"219" }, { "desc":"You can export one or more script files from the script directory. The exported files store the latest content in the development state.Log in to the DataArts Studio cons", @@ -1931,8 +1976,8 @@ "title":"Exporting and Importing Scripts", "uri":"dataartsstudio_01_0428.html", "doc_type":"usermanual", - "p_code":"211", - "code":"215" + "p_code":"216", + "code":"220" }, { "desc":"This section describes how to view the references of a script or all the scripts in a folder.A script has been developed based on Developing Scripts.Log in to the DataArt", @@ -1940,17 +1985,17 @@ "title":"Viewing Script References", "uri":"dataartsstudio_01_0471.html", "doc_type":"usermanual", - "p_code":"211", - "code":"216" + "p_code":"216", + "code":"221" }, { - "desc":"If you do not need to use a script any more, perform the following operations to delete it.When you delete a script, the system checks whether the script is being referen", + "desc":"If you do not need to use a script any longer, perform the following operations to delete it.When you delete a script, the system checks whether the script is being refer", "product_code":"dataartsstudio", "title":"Deleting a Script", "uri":"dataartsstudio_01_0429.html", "doc_type":"usermanual", - "p_code":"211", - "code":"217" + "p_code":"216", + "code":"222" }, { "desc":"Script and job unlocking depends on the lock function of DataArts Factory.The lock function prevents conflict caused by collaborative script or job development. If you cr", @@ -1958,8 +2003,8 @@ "title":"Unlocking a Script", "uri":"dataartsstudio_01_0912.html", "doc_type":"usermanual", - "p_code":"211", - "code":"218" + "p_code":"216", + "code":"223" }, { "desc":"DataArts Factory allows you to change the script owner with a few clicks.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Stu", @@ -1967,8 +2012,8 @@ "title":"Changing the Script Owner", "uri":"dataartsstudio_01_1102.html", "doc_type":"usermanual", - "p_code":"211", - "code":"219" + "p_code":"216", + "code":"224" }, { "desc":"This section describes how to unlock scripts in batches.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Cons", @@ -1976,8 +2021,8 @@ "title":"Unlocking Scripts", "uri":"dataartsstudio_01_1107.html", "doc_type":"usermanual", - "p_code":"211", - "code":"220" + "p_code":"216", + "code":"225" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -1985,8 +2030,8 @@ "title":"Job Development", "uri":"dataartsstudio_01_0431.html", "doc_type":"usermanual", - "p_code":"194", - "code":"221" + "p_code":"199", + "code":"226" }, { "desc":"The job development function provides the following capabilities:Provides a graphical designer that allows you to quickly build a data processing workflow by drag-and-dro", @@ -1994,17 +2039,17 @@ "title":"Job Development Process", "uri":"dataartsstudio_01_0432.html", "doc_type":"usermanual", - "p_code":"221", - "code":"222" + "p_code":"226", + "code":"227" }, { - "desc":"A job is composed of one or more nodes that are performed collaboratively to complete data operations. Before developing a job, create a new one.Each workspace can hold a", + "desc":"A job is composed of one or more nodes that are performed collaboratively to complete data operations. Before developing a job, create a new one.A workspace can contain a", "product_code":"dataartsstudio", "title":"Creating a Job", "uri":"dataartsstudio_01_0434.html", "doc_type":"usermanual", - "p_code":"221", - "code":"223" + "p_code":"226", + "code":"228" }, { "desc":"This section describes how to develop and configure a job.For details about how to develop a batch processing job or real-time processing job in pipeline mode, see Compil", @@ -2012,8 +2057,8 @@ "title":"Developing a Pipeline Job", "uri":"dataartsstudio_01_0435.html", "doc_type":"usermanual", - "p_code":"221", - "code":"224" + "p_code":"226", + "code":"229" }, { "desc":"This section describes how to develop and configure a job.For details about how to develop a batch processing job in single-task mode, see sections Developing an SQL Scri", @@ -2021,35 +2066,35 @@ "title":"Developing a Batch Processing Single-Task SQL Job", "uri":"dataartsstudio_01_1436.html", "doc_type":"usermanual", - "p_code":"221", - "code":"225" + "p_code":"226", + "code":"230" }, { "desc":"This section describes how to develop and configure a job.For details about how to develop a real-time processing Flink SQL job in single-task mode, see sections Developi", "product_code":"dataartsstudio", - "title":"Developing a Real-Time Processing Single-Task Flink SQL Job", + "title":"Developing a Real-Time Processing Single-Task MRS Flink SQL Job", "uri":"dataartsstudio_01_1823.html", "doc_type":"usermanual", - "p_code":"221", - "code":"226" + "p_code":"226", + "code":"231" }, { - "desc":"A single-task real-time processing Flink Jar job has been created. For details, see Creating a Job.", + "desc":"A single-task real-time processing Flink Jar job has been created. For details, see Creating a Job.After setting the parameters, click Save and submit the job.Click Start", "product_code":"dataartsstudio", - "title":"Developing a Real-Time Processing Single-Task Flink Jar Job", + "title":"Developing a Real-Time Processing Single-Task MRS Flink Jar Job", "uri":"dataartsstudio_01_1824.html", "doc_type":"usermanual", - "p_code":"221", - "code":"227" + "p_code":"226", + "code":"232" }, { - "desc":"A single-task real-time processing DLI Spark job has been created. For details, see Creating a Job.", + "desc":"A single-task real-time processing DLI Spark job has been created. For details, see Creating a Job.After setting the parameters, click Save and submit the job.Click Start", "product_code":"dataartsstudio", "title":"Developing a Real-Time Processing Single-Task DLI Spark Job", "uri":"dataartsstudio_01_1825.html", "doc_type":"usermanual", - "p_code":"221", - "code":"228" + "p_code":"226", + "code":"233" }, { "desc":"This section describes how to set up scheduling for an orchestrated job.If the processing mode of a job is batch processing, configure scheduling types for jobs. Three sc", @@ -2057,8 +2102,8 @@ "title":"Setting Up Scheduling for a Job", "uri":"dataartsstudio_01_0470.html", "doc_type":"usermanual", - "p_code":"221", - "code":"229" + "p_code":"226", + "code":"234" }, { "desc":"Submitting a version depends on the version management function of DataArts Factory.Version management traces script and job changes, and supports version comparison and ", @@ -2066,17 +2111,17 @@ "title":"Submitting a Version", "uri":"dataartsstudio_01_0902.html", "doc_type":"usermanual", - "p_code":"221", - "code":"230" + "p_code":"226", + "code":"235" }, { - "desc":"In enterprise mode, when a developer submits a job version, the system generates a job release task. After the developer confirms the release task and the admin, deployer", + "desc":"In enterprise mode, when a developer submits a job version, the system generates a job release task. After the developer confirms releasing a package and the admin, deplo", "product_code":"dataartsstudio", "title":"Releasing a Job Task", "uri":"dataartsstudio_01_1903.html", "doc_type":"usermanual", - "p_code":"221", - "code":"231" + "p_code":"226", + "code":"236" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2084,8 +2129,8 @@ "title":"(Optional) Managing Jobs", "uri":"dataartsstudio_01_0408.html", "doc_type":"usermanual", - "p_code":"221", - "code":"232" + "p_code":"226", + "code":"237" }, { "desc":"This section describes how to copy a job.A job has been developed. For details about how to develop a job, see Developing a Pipeline Job.Log in to the DataArts Studio con", @@ -2093,8 +2138,8 @@ "title":"Copying a Job", "uri":"dataartsstudio_01_0440.html", "doc_type":"usermanual", - "p_code":"232", - "code":"233" + "p_code":"237", + "code":"238" }, { "desc":"You can copy the name of a job and rename a job.A job has been developed. For details about how to develop a job, see Developing a Pipeline Job.Log in to the DataArts Stu", @@ -2102,8 +2147,8 @@ "title":"Copying the Job Name and Renaming a Job", "uri":"dataartsstudio_01_0436.html", "doc_type":"usermanual", - "p_code":"232", - "code":"234" + "p_code":"237", + "code":"239" }, { "desc":"You can move a job file from one directory to another or move a job directory to another directory.A job has been developed. For details about how to develop a job, see D", @@ -2111,8 +2156,8 @@ "title":"Moving a Job or Job Directory", "uri":"dataartsstudio_01_0437.html", "doc_type":"usermanual", - "p_code":"232", - "code":"235" + "p_code":"237", + "code":"240" }, { "desc":"Exporting jobs is to export the latest saved content in the development state.After a job is imported, the content in the development state is overwritten and a new versi", @@ -2120,17 +2165,17 @@ "title":"Exporting and Importing Jobs", "uri":"dataartsstudio_01_0438.html", "doc_type":"usermanual", - "p_code":"232", - "code":"236" + "p_code":"237", + "code":"241" }, { - "desc":"If you do not need to use a job any more, perform the following operations to delete it to reduce the quota usage of the job.Deleted jobs cannot be recovered. Exercise ca", + "desc":"If you do not need to use a job any longer, perform the following operations to delete it to reduce the quota usage of the job.Deleted jobs cannot be recovered. Exercise ", "product_code":"dataartsstudio", "title":"Deleting a Job", "uri":"dataartsstudio_01_0439.html", "doc_type":"usermanual", - "p_code":"232", - "code":"237" + "p_code":"237", + "code":"242" }, { "desc":"Script and job unlocking depends on the lock function of DataArts Factory.The lock function prevents conflict caused by collaborative script or job development. If you cr", @@ -2138,8 +2183,8 @@ "title":"Unlocking a Job", "uri":"dataartsstudio_01_0913.html", "doc_type":"usermanual", - "p_code":"232", - "code":"238" + "p_code":"237", + "code":"243" }, { "desc":"You can view a job dependency graph to learn the upstream and downstream jobs associated with the job.Dependent jobs have been configured in the job scheduling configurat", @@ -2147,8 +2192,8 @@ "title":"Viewing a Job Dependency Graph", "uri":"dataartsstudio_01_1097.html", "doc_type":"usermanual", - "p_code":"232", - "code":"239" + "p_code":"237", + "code":"244" }, { "desc":"DataArts Factory allows you to change the job owner with a few clicks.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio", @@ -2156,8 +2201,8 @@ "title":"Changing the Job Owner", "uri":"dataartsstudio_01_1101.html", "doc_type":"usermanual", - "p_code":"232", - "code":"240" + "p_code":"237", + "code":"245" }, { "desc":"This section describes how to unlock jobs in batches.Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console", @@ -2165,8 +2210,8 @@ "title":"Unlocking Jobs", "uri":"dataartsstudio_01_1108.html", "doc_type":"usermanual", - "p_code":"232", - "code":"241" + "p_code":"237", + "code":"246" }, { "desc":"From the job directory tree, you can quickly switch to the job monitoring page to view the monitoring details of the job.Log in to the DataArts Studio console by followin", @@ -2174,8 +2219,17 @@ "title":"Going to Monitor Job page", "uri":"dataartsstudio_01_1209.html", "doc_type":"usermanual", - "p_code":"232", - "code":"242" + "p_code":"237", + "code":"247" + }, + { + "desc":"You can configure notifications for a job. Right-click a job name and select Configure Notification. For details, see Configuring Notifications.To modify existing notific", + "product_code":"dataartsstudio", + "title":"Configuring Notifications", + "uri":"dataartsstudio_01_1210.html", + "doc_type":"usermanual", + "p_code":"237", + "code":"248" }, { "desc":"The solution aims to provide users with convenient and systematic management operations and better meet service requirements and objectives. Each solution can contain one", @@ -2183,8 +2237,8 @@ "title":"Solution", "uri":"dataartsstudio_01_0503.html", "doc_type":"usermanual", - "p_code":"194", - "code":"243" + "p_code":"199", + "code":"249" }, { "desc":"This section describes how to view the execution history of scripts, jobs, and nodes over a week.This function depends on OBS buckets. For details about how to configure ", @@ -2192,8 +2246,8 @@ "title":"Execution History", "uri":"dataartsstudio_01_1105.html", "doc_type":"usermanual", - "p_code":"194", - "code":"244" + "p_code":"199", + "code":"250" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2201,8 +2255,8 @@ "title":"O&M and Scheduling", "uri":"dataartsstudio_01_0505.html", "doc_type":"usermanual", - "p_code":"194", - "code":"245" + "p_code":"199", + "code":"251" }, { "desc":"Choose Monitoring > Overview. On the Overview page, you can view the statistics of job instances in charts. Currently, you can view seven types of statistics:StatusYou ca", @@ -2210,8 +2264,8 @@ "title":"Overview", "uri":"dataartsstudio_01_0506.html", "doc_type":"usermanual", - "p_code":"245", - "code":"246" + "p_code":"251", + "code":"252" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2219,8 +2273,8 @@ "title":"Monitoring a Job", "uri":"dataartsstudio_01_0413.html", "doc_type":"usermanual", - "p_code":"245", - "code":"247" + "p_code":"251", + "code":"253" }, { "desc":"In the batch processing mode, data is processed periodically in batches based on the job-level scheduling plan, which is used in scenarios with low real-time requirements", @@ -2228,8 +2282,8 @@ "title":"Monitoring a Batch Job", "uri":"dataartsstudio_01_0508.html", "doc_type":"usermanual", - "p_code":"247", - "code":"248" + "p_code":"253", + "code":"254" }, { "desc":"In the real-time processing mode, data is processed in real time, which is used in scenarios with high real-time performance. This type of job is a pipeline that consists", @@ -2237,8 +2291,8 @@ "title":"Monitoring a Real-Time Job", "uri":"dataartsstudio_01_0509.html", "doc_type":"usermanual", - "p_code":"247", - "code":"249" + "p_code":"253", + "code":"255" }, { "desc":"Each time a job is executed, a job instance record is generated. In the navigation pane of the DataArts Factory console, choose Monitoring. On the Monitor Instance page, ", @@ -2246,8 +2300,8 @@ "title":"Instance Monitoring", "uri":"dataartsstudio_01_0511.html", "doc_type":"usermanual", - "p_code":"245", - "code":"250" + "p_code":"251", + "code":"256" }, { "desc":"In the navigation tree of the DataArts Factory console, choose MonitoringMonitor PatchData.On the PatchData Monitoring page, you can view the PatchData job status, date, ", @@ -2255,17 +2309,17 @@ "title":"Monitoring PatchData", "uri":"dataartsstudio_01_0512.html", "doc_type":"usermanual", - "p_code":"245", - "code":"251" + "p_code":"251", + "code":"257" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"Managing Notifications", + "title":"Notification Management", "uri":"dataartsstudio_01_0414.html", "doc_type":"usermanual", - "p_code":"245", - "code":"252" + "p_code":"251", + "code":"258" }, { "desc":"You can configure job notification tasks to notify you of job success or failures.Before configuring a notification for a job:Message notification has been enabled and a ", @@ -2273,8 +2327,8 @@ "title":"Managing Notifications", "uri":"dataartsstudio_01_0514.html", "doc_type":"usermanual", - "p_code":"252", - "code":"253" + "p_code":"258", + "code":"259" }, { "desc":"Notifications can be set to specified personnel by day, week, or month, allowing related personnel to regularly understand job scheduling information about the quantity o", @@ -2282,17 +2336,8 @@ "title":"Cycle Overview", "uri":"dataartsstudio_01_0515.html", "doc_type":"usermanual", - "p_code":"252", - "code":"254" - }, - { - "desc":"You can configure terminal subscriptions (SMS messages, emails, and phone calls) by owner. After configuring a subscription, you can use the Manage Notification function ", - "product_code":"dataartsstudio", - "title":"Managing Terminal Subscriptions", - "uri":"dataartsstudio_01_2515.html", - "doc_type":"usermanual", - "p_code":"252", - "code":"255" + "p_code":"258", + "code":"260" }, { "desc":"You can back up all jobs, scripts, resources, and environment variables at a specified interval.You can also restore assets that have been backed up, including jobs, scri", @@ -2300,8 +2345,8 @@ "title":"Managing Backups", "uri":"dataartsstudio_01_0516.html", "doc_type":"usermanual", - "p_code":"245", - "code":"256" + "p_code":"251", + "code":"261" }, { "desc":"You can view historical operations on the Operation History page. The system stores data for a maximum of three months and automatically deletes older data.Log in to the ", @@ -2309,8 +2354,8 @@ "title":"Operation History", "uri":"dataartsstudio_01_1822.html", "doc_type":"usermanual", - "p_code":"245", - "code":"257" + "p_code":"251", + "code":"262" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2318,8 +2363,8 @@ "title":"Configuration and Management", "uri":"dataartsstudio_01_0517.html", "doc_type":"usermanual", - "p_code":"194", - "code":"258" + "p_code":"199", + "code":"263" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2327,8 +2372,8 @@ "title":"Configuring Resources", "uri":"dataartsstudio_01_0510.html", "doc_type":"usermanual", - "p_code":"258", - "code":"259" + "p_code":"263", + "code":"264" }, { "desc":"This topic describes how to configure and use environment variables.Configure job parameters. If a parameter belongs to multiple jobs, you can extract this parameter as a", @@ -2336,8 +2381,8 @@ "title":"Configuring Environment Variables", "uri":"dataartsstudio_01_0504.html", "doc_type":"usermanual", - "p_code":"259", - "code":"260" + "p_code":"264", + "code":"265" }, { "desc":"The execution history of scripts, jobs, and nodes is stored in OBS buckets. If no OBS bucket is available, you cannot view the execution history. This section describes h", @@ -2345,8 +2390,8 @@ "title":"Configuring an OBS Bucket", "uri":"dataartsstudio_01_1106.html", "doc_type":"usermanual", - "p_code":"259", - "code":"261" + "p_code":"264", + "code":"266" }, { "desc":"Job tags are used to label jobs of the same or similar purposes to facilitate job management and query. This section describes how to manage job tags, including adding, d", @@ -2354,8 +2399,8 @@ "title":"Managing Job Tags", "uri":"dataartsstudio_01_0532.html", "doc_type":"usermanual", - "p_code":"259", - "code":"262" + "p_code":"264", + "code":"267" }, { "desc":"The following problems may occur during job execution in DataArts Factory:The job execution mechanism of the DataArts Factory module is to execute the job as the user who", @@ -2363,8 +2408,8 @@ "title":"Configuring a Scheduling Identity", "uri":"dataartsstudio_01_0555.html", "doc_type":"usermanual", - "p_code":"259", - "code":"263" + "p_code":"264", + "code":"268" }, { "desc":"This section describes how to configure the maximum number of job nodes that can run concurrently in a workspace.The number of concurrently running nodes in the workspace", @@ -2372,26 +2417,26 @@ "title":"Configuring the Number of Concurrently Running Nodes", "uri":"dataartsstudio_01_1280.html", "doc_type":"usermanual", - "p_code":"259", - "code":"264" + "p_code":"264", + "code":"269" }, { - "desc":"This section describes how to create and use a Flink SQL template. When writing Flink SQL code, you can use an SQL template for repeated service logic. In addition, you c", + "desc":"This section describes how to create and use a template. When writing code, you can use an SQL template for repeated service logic. In addition, you can use a job paramet", "product_code":"dataartsstudio", "title":"Configuring a Template", "uri":"dataartsstudio_01_1282.html", "doc_type":"usermanual", - "p_code":"259", - "code":"265" + "p_code":"264", + "code":"270" }, { - "desc":"You can configure a scheduling calendar and specify the working days for scheduling a job.This function is available for batch processing jobs but not for real-time proce", + "desc":"You can configure a scheduling calendar and specify the working days for scheduling a job.After creating a scheduling calendar, you can go to the DataArts Factory console", "product_code":"dataartsstudio", "title":"Configuring a Scheduling Calendar", "uri":"dataartsstudio_01_1283.html", "doc_type":"usermanual", - "p_code":"259", - "code":"266" + "p_code":"264", + "code":"271" }, { "desc":"This section describes how to configure a default item. You can perform the operations in this section only if you have the permissions of DARTS Administrator or Tenant A", @@ -2399,8 +2444,8 @@ "title":"Configuring a Default Item", "uri":"dataartsstudio_01_04501.html", "doc_type":"usermanual", - "p_code":"259", - "code":"267" + "p_code":"264", + "code":"272" }, { "desc":"By configuring a task group, you can control the maximum number of concurrent nodes in a task group in a more fine-grained manner.This function is available only for batc", @@ -2408,8 +2453,8 @@ "title":"Configuring Task Groups", "uri":"dataartsstudio_01_1284.html", "doc_type":"usermanual", - "p_code":"259", - "code":"268" + "p_code":"264", + "code":"273" }, { "desc":"You can upload custom code or text files as resources on Manage Resource and schedule them when running nodes. Nodes that can invoke resources include DLI Spark, MRS Spar", @@ -2417,17 +2462,17 @@ "title":"Managing Resources", "uri":"dataartsstudio_01_0519.html", "doc_type":"usermanual", - "p_code":"258", - "code":"269" + "p_code":"263", + "code":"274" }, { - "desc":"For a workspace in simple mode, you can set the reviewer for the scripts and jobs you submit.Only the admin of the current workspace can manage reviewers, including creat", + "desc":"For a workspace in simple mode, you can set the reviewer for the scripts and jobs you submit. In the review center, you can manage applications and configure and maintain", "product_code":"dataartsstudio", "title":"Review Center", "uri":"dataartsstudio_01_1820.html", "doc_type":"usermanual", - "p_code":"194", - "code":"270" + "p_code":"199", + "code":"275" }, { "desc":"You can download or dump SQL script execution results. After downloading or dumping the SQL execution results, you can view them on the Download Center page.Records are g", @@ -2435,8 +2480,8 @@ "title":"Download Center", "uri":"dataartsstudio_01_1821.html", "doc_type":"usermanual", - "p_code":"194", - "code":"271" + "p_code":"199", + "code":"276" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2444,8 +2489,8 @@ "title":"Node Reference", "uri":"dataartsstudio_01_0441.html", "doc_type":"usermanual", - "p_code":"194", - "code":"272" + "p_code":"199", + "code":"277" }, { "desc":"A node defines the operations performed on data. DataArts Factory provides nodes used for data integration, computing and analysis, database operations, and resource mana", @@ -2453,8 +2498,8 @@ "title":"Node Overview", "uri":"dataartsstudio_01_0442.html", "doc_type":"usermanual", - "p_code":"272", - "code":"273" + "p_code":"277", + "code":"278" }, { "desc":"The CDM Job node is used to run a predefined CDM job for data migration.If you have configured a macro variable of date and time in a CDM job and schedule the CDM job thr", @@ -2462,8 +2507,8 @@ "title":"CDM Job", "uri":"dataartsstudio_01_0443.html", "doc_type":"usermanual", - "p_code":"272", - "code":"274" + "p_code":"277", + "code":"279" }, { "desc":"The Rest Client node is used to respond to RESTful requests in cloud.For details about how to use the Rest Client operator, see Obtaining the Return Value of a Rest Clien", @@ -2471,8 +2516,8 @@ "title":"Rest Client", "uri":"dataartsstudio_01_0447.html", "doc_type":"usermanual", - "p_code":"272", - "code":"275" + "p_code":"277", + "code":"280" }, { "desc":"The Import GES node is used to import files from an OBS bucket to a GES graph.Table 1 and Table 2 describe the parameters of the Import GES node.", @@ -2480,8 +2525,8 @@ "title":"Import GES", "uri":"dataartsstudio_01_0448.html", "doc_type":"usermanual", - "p_code":"272", - "code":"276" + "p_code":"277", + "code":"281" }, { "desc":"The MRS Kafka node is used to query the number of messages that are not consumed by a topic.Table 1 and Table 2 describe the parameters of the MRS Kafka node.", @@ -2489,8 +2534,8 @@ "title":"MRS Kafka", "uri":"dataartsstudio_01_0537.html", "doc_type":"usermanual", - "p_code":"272", - "code":"277" + "p_code":"277", + "code":"282" }, { "desc":"The Kafka Client node is used to send data to Kafka topics.You can learn more about how to use the Kafka Client node in .Table 1 describes the parameters of the Kafka Cli", @@ -2498,8 +2543,8 @@ "title":"Kafka Client", "uri":"dataartsstudio_01_0538.html", "doc_type":"usermanual", - "p_code":"272", - "code":"278" + "p_code":"277", + "code":"283" }, { "desc":"The ROMA FDI Job node executes a predefined ROMA Connect data integration task to implement data integration and conversion between the source and destination.This node e", @@ -2507,26 +2552,26 @@ "title":"ROMA FDI Job", "uri":"dataartsstudio_01_1098.html", "doc_type":"usermanual", - "p_code":"272", - "code":"279" + "p_code":"277", + "code":"284" }, { "desc":"The DLI Flink Job node is used to create and start jobs or check whether DLI jobs are running to analyze streaming big data in real time.After a DLI Flink streaming job i", "product_code":"dataartsstudio", - "title":"DLI Flink Job", + "title":"DLI Flink Job", "uri":"dataartsstudio_01_0536.html", "doc_type":"usermanual", - "p_code":"272", - "code":"280" + "p_code":"277", + "code":"285" }, { - "desc":"The DLI SQL node is used to transfer SQL statements to DLI for data source analysis and exploration.This node enables you to execute DLI statements during periodical or r", + "desc":"The DLI SQL node is used to transfer SQL statements to DLI SQL for data source analysis and exploration.This node enables you to execute DLI statements during periodical ", "product_code":"dataartsstudio", "title":"DLI SQL", "uri":"dataartsstudio_01_0450.html", "doc_type":"usermanual", - "p_code":"272", - "code":"281" + "p_code":"277", + "code":"286" }, { "desc":"The DLI Spark node is used to execute a predefined Spark job.For details about how to use the DLI Spark node, see Developing a DLI Spark Job.Table 1, Table 2, and Table 3", @@ -2534,8 +2579,8 @@ "title":"DLI Spark", "uri":"dataartsstudio_01_0451.html", "doc_type":"usermanual", - "p_code":"272", - "code":"282" + "p_code":"277", + "code":"287" }, { "desc":"The DWS SQL node is used to transfer SQL statements to DWS.For details about how to use the DWS SQL operator, see Developing a DWS SQL Job.This node enables you to execut", @@ -2543,8 +2588,8 @@ "title":"DWS SQL", "uri":"dataartsstudio_01_0452.html", "doc_type":"usermanual", - "p_code":"272", - "code":"283" + "p_code":"277", + "code":"288" }, { "desc":"The MRS Spark SQL node is used to execute a predefined SparkSQL statement on MRS.Table 1, Table 2, and Table 3 describe the parameters of the MRS Spark SQLnode node.", @@ -2552,8 +2597,8 @@ "title":"MRS Spark SQL", "uri":"dataartsstudio_01_0453.html", "doc_type":"usermanual", - "p_code":"272", - "code":"284" + "p_code":"277", + "code":"289" }, { "desc":"The MRS Hive SQL node is used to execute a predefined Hive SQL script in DataArts Factory.For details about how to use the MRS Hive SQL node, see Developing a Hive SQL Jo", @@ -2561,8 +2606,8 @@ "title":"MRS Hive SQL", "uri":"dataartsstudio_01_0454.html", "doc_type":"usermanual", - "p_code":"272", - "code":"285" + "p_code":"277", + "code":"290" }, { "desc":"The MRS Presto SQL node is used to execute the Presto SQL script predefined in DataArts Factory.Table 1, Table 2, and Table 3 describe the parameters of the MRS Presto SQ", @@ -2570,8 +2615,8 @@ "title":"MRS Presto SQL", "uri":"dataartsstudio_01_1099.html", "doc_type":"usermanual", - "p_code":"272", - "code":"286" + "p_code":"277", + "code":"291" }, { "desc":"The MRS Spark node is used to execute a predefined Spark job on MRS.Table 1, Table 2, and Table 3 describe the parameters of the MRS Sparknode node.", @@ -2579,8 +2624,8 @@ "title":"MRS Spark", "uri":"dataartsstudio_01_0455.html", "doc_type":"usermanual", - "p_code":"272", - "code":"287" + "p_code":"277", + "code":"292" }, { "desc":"The MRS Spark Python node is used to execute a predefined Spark Python job on MRS.For details about how to use the MRS Spark Python operator, see Developing an MRS Spark ", @@ -2588,8 +2633,26 @@ "title":"MRS Spark Python", "uri":"dataartsstudio_01_0456.html", "doc_type":"usermanual", - "p_code":"272", - "code":"288" + "p_code":"277", + "code":"293" + }, + { + "desc":"The MRS ClickHouse node is used to execute the ClickHouse SQL script predefined in DataArts Factory.Table 1, Table 2, and Table 3 describe the parameters of the MRS Click", + "product_code":"dataartsstudio", + "title":"MRS ClickHouse", + "uri":"dataartsstudio_01_0528.html", + "doc_type":"usermanual", + "p_code":"277", + "code":"294" + }, + { + "desc":"The MRS Impala SQL node is used to execute the Impala SQL script predefined in DataArts Factory.Table 1 and Table 2 describe the parameters of the MRS Impala node.", + "product_code":"dataartsstudio", + "title":"MRS Impala SQL", + "uri":"dataartsstudio_01_1104.html", + "doc_type":"usermanual", + "p_code":"277", + "code":"295" }, { "desc":"The MRS Flink Job node is used to execute the Flink SQL script and Flink job predefined in DataArts Factory.Table 1 and Table 2 describe the parameters of the MRS Flink n", @@ -2597,8 +2660,8 @@ "title":"MRS Flink Job", "uri":"dataartsstudio_01_0554.html", "doc_type":"usermanual", - "p_code":"272", - "code":"289" + "p_code":"277", + "code":"296" }, { "desc":"The MRS MapReduce node is used to execute a predefined MapReduce program on MRS.Table 1 and Table 2 describe the parameters of the MRS MapReduce node.", @@ -2606,8 +2669,8 @@ "title":"MRS MapReduce", "uri":"dataartsstudio_01_0457.html", "doc_type":"usermanual", - "p_code":"272", - "code":"290" + "p_code":"277", + "code":"297" }, { "desc":"The CSS node is used to process CSS requests and enable online distributed searching.Table 1 and Table 2 describe the parameters of the CSS node.", @@ -2615,8 +2678,8 @@ "title":"CSS", "uri":"dataartsstudio_01_0458.html", "doc_type":"usermanual", - "p_code":"272", - "code":"291" + "p_code":"277", + "code":"298" }, { "desc":"The Shell node is used to execute a shell script.With EL expression #{Job.getNodeOutput()}, you can obtain the desired content (4000 characters at most and counted backwa", @@ -2624,8 +2687,8 @@ "title":"Shell", "uri":"dataartsstudio_01_0459.html", "doc_type":"usermanual", - "p_code":"272", - "code":"292" + "p_code":"277", + "code":"299" }, { "desc":"The RDS SQL node is used to transfer SQL statements to RDS.Table 1 and Table 2 describe the parameters of the RDS SQL node.", @@ -2633,8 +2696,8 @@ "title":"RDS SQL", "uri":"dataartsstudio_01_0460.html", "doc_type":"usermanual", - "p_code":"272", - "code":"293" + "p_code":"277", + "code":"300" }, { "desc":"The ETL Job node is used to extract data from a specified data source, preprocess the data, and import the data to the target data source.The destination is the ETL Job n", @@ -2642,8 +2705,8 @@ "title":"ETL Job", "uri":"dataartsstudio_01_0461.html", "doc_type":"usermanual", - "p_code":"272", - "code":"294" + "p_code":"277", + "code":"301" }, { "desc":"Before using a Python node, ensure that the host connected to the node has an environment for executing Python scripts.The Python node is used to execute Python statement", @@ -2651,8 +2714,17 @@ "title":"Python", "uri":"dataartsstudio_01_4504.html", "doc_type":"usermanual", - "p_code":"272", - "code":"295" + "p_code":"277", + "code":"302" + }, + { + "desc":"The Doris SQL node transfers SQL statements to Doris for execution.Table 1 and Table 2 describe the parameters of the Doris SQL node.", + "product_code":"dataartsstudio", + "title":"DORIS SQL", + "uri":"dataartsstudio_01_4509.html", + "doc_type":"usermanual", + "p_code":"277", + "code":"303" }, { "desc":"You can orchestrate ModelArts Train operators to schedule the ModelArts workflow in DataArts Studio.Table 1 and Table 2 describe the parameters of the ModelArts Train nod", @@ -2660,17 +2732,8 @@ "title":"ModelArts Train", "uri":"dataartsstudio_01_4500.html", "doc_type":"usermanual", - "p_code":"272", - "code":"296" - }, - { - "desc":"Http Trigger is a cross-platform scheduling trigger node of DataArts Studio. If you want to trigger a job on DataArts Studio after a job on another scheduling system is c", - "product_code":"dataartsstudio", - "title":"Http Trigger", - "uri":"dataartsstudio_01_0489.html", - "doc_type":"usermanual", - "p_code":"272", - "code":"297" + "p_code":"277", + "code":"304" }, { "desc":"The OBS path cannot be a log path starting with s3a://.This function depends on OBS.The Create OBS node is used to create buckets and directories on OBS.Table 1 and Table", @@ -2678,8 +2741,8 @@ "title":"Create OBS", "uri":"dataartsstudio_01_0462.html", "doc_type":"usermanual", - "p_code":"272", - "code":"298" + "p_code":"277", + "code":"305" }, { "desc":"This function depends on OBS.The Delete OBS node is used to delete a bucket or directory on OBS.Table 1 and Table 2 describe the parameters of the Delete OBS node.", @@ -2687,8 +2750,8 @@ "title":"Delete OBS", "uri":"dataartsstudio_01_0463.html", "doc_type":"usermanual", - "p_code":"272", - "code":"299" + "p_code":"277", + "code":"306" }, { "desc":"This function depends on OBS.The OBS Manager node is used to move or copy files from an OBS bucket to a specified directory.Table 1, Table 2, and Table 3 describe the par", @@ -2696,17 +2759,17 @@ "title":"OBS Manager", "uri":"dataartsstudio_01_0464.html", "doc_type":"usermanual", - "p_code":"272", - "code":"300" + "p_code":"277", + "code":"307" }, { - "desc":"You can use the Open/Close Resource node to enable or disable cloud services as required.Table 1 and Table 2 describe the parameters of the Open/Close Resource node.", + "desc":"You can use the Open/Close Resource node to enable or disable services as required.Table 1 and Table 2 describe the parameters of the Open/Close Resource node.", "product_code":"dataartsstudio", "title":"Open/Close Resource", "uri":"dataartsstudio_01_0465.html", "doc_type":"usermanual", - "p_code":"272", - "code":"301" + "p_code":"277", + "code":"308" }, { "desc":"The Subjob node is used to call the batch job that does not contain the subjob node.Table 1 and Table 2 describe the parameters of the Subjob node.", @@ -2714,8 +2777,8 @@ "title":"Subjob", "uri":"dataartsstudio_01_0467.html", "doc_type":"usermanual", - "p_code":"272", - "code":"302" + "p_code":"277", + "code":"309" }, { "desc":"The For Each node specifies a subjob to be executed cyclically and assigns values to variables in a subjob with a dataset.When a For Each node is executed once, a specifi", @@ -2723,8 +2786,8 @@ "title":"For Each", "uri":"dataartsstudio_01_0535.html", "doc_type":"usermanual", - "p_code":"272", - "code":"303" + "p_code":"277", + "code":"310" }, { "desc":"The SMN node is used to send notifications to users.Table 1 and Table 2 describe the parameters of the SMN node.", @@ -2732,8 +2795,8 @@ "title":"SMN", "uri":"dataartsstudio_01_0468.html", "doc_type":"usermanual", - "p_code":"272", - "code":"304" + "p_code":"277", + "code":"311" }, { "desc":"The Dummy node is empty and does not perform any operations. It is used to simplify the complex connection relationships of nodes. Figure 1 shows an example.Table 1 descr", @@ -2741,8 +2804,8 @@ "title":"Dummy", "uri":"dataartsstudio_01_0469.html", "doc_type":"usermanual", - "p_code":"272", - "code":"305" + "p_code":"277", + "code":"312" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2750,8 +2813,8 @@ "title":"EL Expression Reference", "uri":"dataartsstudio_01_0493.html", "doc_type":"usermanual", - "p_code":"194", - "code":"306" + "p_code":"199", + "code":"313" }, { "desc":"Node parameter values in a DataArts Factory job can be dynamically generated based on the running environment by using Expression Language (EL). You can determine whether", @@ -2759,8 +2822,8 @@ "title":"Expression Overview", "uri":"dataartsstudio_01_0494.html", "doc_type":"usermanual", - "p_code":"306", - "code":"307" + "p_code":"313", + "code":"314" }, { "desc":"EL supports most of the arithmetic and logic operators provided by Java.If variable a is empty, default is returned. If variable a is not empty, a itself is returned. The", @@ -2768,8 +2831,8 @@ "title":"Basic Operators", "uri":"dataartsstudio_01_0495.html", "doc_type":"usermanual", - "p_code":"306", - "code":"308" + "p_code":"313", + "code":"315" }, { "desc":"The date and time in the EL expression can be displayed in a user-specified format. The date and time format is specified by the date and time mode character string. The ", @@ -2777,8 +2840,8 @@ "title":"Date and Time Mode", "uri":"dataartsstudio_01_0496.html", "doc_type":"usermanual", - "p_code":"306", - "code":"309" + "p_code":"313", + "code":"316" }, { "desc":"An Env embedded object provides a method of obtaining an environment variable value.The EL expression used to obtain the value of environment variable test is as follows:", @@ -2786,8 +2849,8 @@ "title":"Env Embedded Objects", "uri":"dataartsstudio_01_0497.html", "doc_type":"usermanual", - "p_code":"306", - "code":"310" + "p_code":"313", + "code":"317" }, { "desc":"A job object provides properties and methods of obtaining the output message, job scheduling plan time, and job execution time of the previous node in a job.The expressio", @@ -2795,8 +2858,8 @@ "title":"Job Embedded Objects", "uri":"dataartsstudio_01_0498.html", "doc_type":"usermanual", - "p_code":"306", - "code":"311" + "p_code":"313", + "code":"318" }, { "desc":"A StringUtil embedded object provides methods of operating character strings, for example, truncating a substring from a character string.StringUtil is implemented throug", @@ -2804,8 +2867,8 @@ "title":"StringUtil Embedded Objects", "uri":"dataartsstudio_01_0499.html", "doc_type":"usermanual", - "p_code":"306", - "code":"312" + "p_code":"313", + "code":"319" }, { "desc":"A DateUtil embedded object provides methods of formatting time and calculating time.The previous day of the job scheduling plan time is used as the subdirectory name to g", @@ -2813,8 +2876,8 @@ "title":"DateUtil Embedded Objects", "uri":"dataartsstudio_01_0500.html", "doc_type":"usermanual", - "p_code":"306", - "code":"313" + "p_code":"313", + "code":"320" }, { "desc":"A JSONUtil embedded object provides JSON object methods.The content of variable str is as follows:The expression for obtaining the area code of city1 is as follows:", @@ -2822,8 +2885,8 @@ "title":"JSONUtil Embedded Objects", "uri":"dataartsstudio_01_0501.html", "doc_type":"usermanual", - "p_code":"306", - "code":"314" + "p_code":"313", + "code":"321" }, { "desc":"You can use Loop embedded objects to obtain data from the For Each node.To obtain the second value of a row that is being processed, use the following EL expression:", @@ -2831,8 +2894,8 @@ "title":"Loop Embedded Objects", "uri":"dataartsstudio_01_0534.html", "doc_type":"usermanual", - "p_code":"306", - "code":"315" + "p_code":"313", + "code":"322" }, { "desc":"The OBSUtil embedded objects provide a series of OBS operation methods, for example, checking whether an OBS file or directory exists.The following is the EL expression f", @@ -2840,8 +2903,8 @@ "title":"OBSUtil Embedded Objects", "uri":"dataartsstudio_01_0553.html", "doc_type":"usermanual", - "p_code":"306", - "code":"316" + "p_code":"313", + "code":"323" }, { "desc":"This section describes common EL expressions and examples.", @@ -2849,8 +2912,8 @@ "title":"Examples of Common EL Expressions", "uri":"dataartsstudio_01_4803.html", "doc_type":"usermanual", - "p_code":"306", - "code":"317" + "p_code":"313", + "code":"324" }, { "desc":"With this example, you can understand how to use EL expressions in the following applications:Using variables in the SQL script of DataArts FactoryTransferring parameters", @@ -2858,8 +2921,8 @@ "title":"EL Expression Use Examples", "uri":"dataartsstudio_01_0502.html", "doc_type":"usermanual", - "p_code":"306", - "code":"318" + "p_code":"313", + "code":"325" }, { "desc":"The simple variable set provides a series of customized variables. Customized parameters are automatically replaced with specific values based on the service date, plan t", @@ -2867,8 +2930,8 @@ "title":"Simple Variable Set", "uri":"dataartsstudio_01_0556.html", "doc_type":"usermanual", - "p_code":"194", - "code":"319" + "p_code":"199", + "code":"326" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -2876,8 +2939,8 @@ "title":"Usage Guidance", "uri":"dataartsstudio_01_0520.html", "doc_type":"usermanual", - "p_code":"194", - "code":"320" + "p_code":"199", + "code":"327" }, { "desc":"This section describes how to reference parameters in scripts and jobs, application scope of the referenced parameters, and whether EL expressions and simple variable set", @@ -2885,8 +2948,8 @@ "title":"Referencing Parameters in Scripts and Jobs", "uri":"dataartsstudio_01_7524.html", "doc_type":"usermanual", - "p_code":"320", - "code":"321" + "p_code":"327", + "code":"328" }, { "desc":"When configuring job scheduling, you can set the scheduling time to the last day of each month using either of the two methods provided in the following table.In DataArts", @@ -2894,8 +2957,8 @@ "title":"Setting the Job Scheduling Time to the Last Day of Each Month", "uri":"dataartsstudio_01_7523.html", "doc_type":"usermanual", - "p_code":"320", - "code":"322" + "p_code":"327", + "code":"329" }, { "desc":"This section describes how to configure a job that is scheduled at a specified time of a year.In DataArts Studio, create a job that is scheduled every month and add an em", @@ -2903,8 +2966,8 @@ "title":"Configuring a Yearly Scheduled Job", "uri":"dataartsstudio_01_7564.html", "doc_type":"usermanual", - "p_code":"320", - "code":"323" + "p_code":"327", + "code":"330" }, { "desc":"In the migration of a project, if you want to supplement historical business data in a previous period and view details of the historical data, PatchData can meet your re", @@ -2912,8 +2975,8 @@ "title":"Using PatchData", "uri":"dataartsstudio_01_0585.html", "doc_type":"usermanual", - "p_code":"320", - "code":"324" + "p_code":"327", + "code":"331" }, { "desc":"This section describes how to obtain the output of an SQL node and apply the output to subsequent nodes or judgment in job development.When you use EL expression #{Job.ge", @@ -2921,8 +2984,8 @@ "title":"Obtaining the Output of an SQL Node", "uri":"dataartsstudio_01_0584.html", "doc_type":"usermanual", - "p_code":"320", - "code":"325" + "p_code":"327", + "code":"332" }, { "desc":"You can run a query SQL statement to transfer the obtained maximum time value to a CDM job. In the advanced attributes of the CDM job, the where clause is used to determi", @@ -2930,8 +2993,8 @@ "title":"Obtaining the Maximum Value and Transferring It to a CDM Job Using a Query SQL Statement", "uri":"dataartsstudio_01_1584.html", "doc_type":"usermanual", - "p_code":"320", - "code":"326" + "p_code":"327", + "code":"333" }, { "desc":"When developing and orchestrating jobs in DataArts Factory, you can use IF statements to determine the branch to execute.This section describes how to use IF statements i", @@ -2939,8 +3002,8 @@ "title":"IF Statements", "uri":"dataartsstudio_01_0583.html", "doc_type":"usermanual", - "p_code":"320", - "code":"327" + "p_code":"327", + "code":"334" }, { "desc":"The Rest Client node can execute RESTful requests.This tutorial describes how to obtain the return value of the Rest Client node, covering the following two application s", @@ -2948,8 +3011,8 @@ "title":"Obtaining the Return Value of a Rest Client Node", "uri":"dataartsstudio_01_0581.html", "doc_type":"usermanual", - "p_code":"320", - "code":"328" + "p_code":"327", + "code":"335" }, { "desc":"During job development, if some jobs have different parameters but the same processing logic, you can use For Each nodes to avoid repeated job development.You can use a F", @@ -2957,8 +3020,8 @@ "title":"Using For Each Nodes", "uri":"dataartsstudio_01_0582.html", "doc_type":"usermanual", - "p_code":"320", - "code":"329" + "p_code":"327", + "code":"336" }, { "desc":"This function applies to the following scenarios:Use a script template for a Flink SQL script.During pipeline job development, use a Fink SQL script which uses a script t", @@ -2966,8 +3029,8 @@ "title":"Using Script Templates and Parameter Templates", "uri":"dataartsstudio_01_1582.html", "doc_type":"usermanual", - "p_code":"320", - "code":"330" + "p_code":"327", + "code":"337" }, { "desc":"This section describes how to develop and execute a Python job using DataArts Factory.An ECS named ecs-dgc has been created.In this example, the ECS uses the CentOS 8.0 6", @@ -2975,8 +3038,8 @@ "title":"Developing a Python Job", "uri":"dataartsstudio_01_0529.html", "doc_type":"usermanual", - "p_code":"320", - "code":"331" + "p_code":"327", + "code":"338" }, { "desc":"This section describes how to use the DWS SQL node to develop a job in DataArts Factory.This tutorial describes how to develop a DWS job to collect the sales volume of a ", @@ -2984,8 +3047,8 @@ "title":"Developing a DWS SQL Job", "uri":"dataartsstudio_01_0524.html", "doc_type":"usermanual", - "p_code":"320", - "code":"332" + "p_code":"327", + "code":"339" }, { "desc":"This section introduces how to develop Hive SQL scripts on DataArts Factory.As a one-stop big data development platform, DataArts Factory supports development of multiple", @@ -2993,8 +3056,8 @@ "title":"Developing a Hive SQL Job", "uri":"dataartsstudio_01_0522.html", "doc_type":"usermanual", - "p_code":"320", - "code":"333" + "p_code":"327", + "code":"340" }, { "desc":"This section introduces how to develop a DLI Spark job on DataArts Factory.In most cases, SQL is used to analyze and process data when using Data Lake Insight (DLI). Howe", @@ -3002,8 +3065,8 @@ "title":"Developing a DLI Spark Job", "uri":"dataartsstudio_01_0521.html", "doc_type":"usermanual", - "p_code":"320", - "code":"334" + "p_code":"327", + "code":"341" }, { "desc":"This section describes how to develop an MRS Spark Python on DataArts Factory.PrerequisitesYou have the permission to access OBS paths.Data preparationPrepare the script ", @@ -3011,8 +3074,8 @@ "title":"Developing an MRS Spark Python Job", "uri":"dataartsstudio_01_0525.html", "doc_type":"usermanual", - "p_code":"320", - "code":"335" + "p_code":"327", + "code":"342" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3020,8 +3083,8 @@ "title":"Audit Log", "uri":"dataartsstudio_01_1200.html", "doc_type":"usermanual", - "p_code":"25", - "code":"336" + "p_code":"11", + "code":"343" }, { "desc":"You can use Cloud Trace Service (CTS) to record key operation events related to DataArts Studio. The events can be used in various scenarios such as security analysis, co", @@ -3029,8 +3092,8 @@ "title":"Viewing Traces", "uri":"dataartsstudio_01_0127.html", "doc_type":"usermanual", - "p_code":"336", - "code":"337" + "p_code":"343", + "code":"344" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3038,8 +3101,8 @@ "title":"Key Operations Recorded by CTS", "uri":"dataartsstudio_01_1207.html", "doc_type":"usermanual", - "p_code":"336", - "code":"338" + "p_code":"343", + "code":"345" }, { "desc":"CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.", @@ -3047,17 +3110,17 @@ "title":"Management Center Operations", "uri":"dataartsstudio_01_1201.html", "doc_type":"usermanual", - "p_code":"338", - "code":"339" + "p_code":"345", + "code":"346" }, { "desc":"CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.", "product_code":"dataartsstudio", - "title":"DataArts Migration Operations", + "title":"Key CDM Operations Recorded by CTS", "uri":"dataartsstudio_01_0126.html", "doc_type":"usermanual", - "p_code":"338", - "code":"340" + "p_code":"345", + "code":"347" }, { "desc":"CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.", @@ -3065,8 +3128,8 @@ "title":"DataArts Factory Operations", "uri":"dataartsstudio_01_1203.html", "doc_type":"usermanual", - "p_code":"338", - "code":"341" + "p_code":"345", + "code":"348" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3075,7 +3138,7 @@ "uri":"dataartsstudio_12_0007.html", "doc_type":"usermanual", "p_code":"", - "code":"342" + "code":"349" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3083,26 +3146,17 @@ "title":"Consultation and Billing", "uri":"dataartsstudio_03_0001.html", "doc_type":"usermanual", - "p_code":"342", - "code":"343" + "p_code":"349", + "code":"350" }, { "desc":"We use a region to identify the location of a data center. You can create resources in a specific region.A region is a physical data center. Each region is completely ind", "product_code":"dataartsstudio", - "title":"Regions", + "title":"How Do I Select a Region?", "uri":"dataartsstudio_03_0052.html", "doc_type":"usermanual", - "p_code":"343", - "code":"344" - }, - { - "desc":"Check whether a user has been added to the workspace. If no, perform the following steps to add the user.", - "product_code":"dataartsstudio", - "title":"What Should I Do If a User Cannot View Workspaces After I Have Assigned the Required Policy to the User?", - "uri":"dataartsstudio_03_0061.html", - "doc_type":"usermanual", - "p_code":"343", - "code":"345" + "p_code":"350", + "code":"351" }, { "desc":"In DataArts Studio, system roles and workspace roles are used to assign permissions. By default, if a user is assigned the DARTS User system role but not a workspace role", @@ -3110,17 +3164,26 @@ "title":"How Do I Isolate Workspaces So That Users Cannot View Unauthorized Workspaces?", "uri":"dataartsstudio_03_0158.html", "doc_type":"usermanual", - "p_code":"343", - "code":"346" + "p_code":"350", + "code":"352" }, { - "desc":"Yes. The procedure is as follows.To prevent service loss caused by mis-deletion, the system allows only the DARTS Administrator or Tenant Administrator to delete workspac", + "desc":"If you assign only the DARTS User system role but not a workspace role to a user, the user cannot access a workspace and an error message is displayed.Check whether the u", + "product_code":"dataartsstudio", + "title":"What Should I Do If a User Cannot View Workspaces After I Have Assigned the Required Policy to the User?", + "uri":"dataartsstudio_03_0061.html", + "doc_type":"usermanual", + "p_code":"350", + "code":"353" + }, + { + "desc":"Yes. The procedure is as follows.Mis-deletion may result in service loss. To delete a workspace, you must use the DARTS Administrator or Tenant Administrator account and ", "product_code":"dataartsstudio", "title":"Can I Delete DataArts Studio Workspaces?", "uri":"dataartsstudio_03_0222.html", "doc_type":"usermanual", - "p_code":"343", - "code":"347" + "p_code":"350", + "code":"354" }, { "desc":"No. Purchased or trial instances cannot be transferred to another account.", @@ -3128,17 +3191,17 @@ "title":"Can I Transfer a Purchased or Trial Instance to Another Account?", "uri":"dataartsstudio_03_0131.html", "doc_type":"usermanual", - "p_code":"343", - "code":"348" + "p_code":"350", + "code":"355" }, { - "desc":"No. You cannot downgrade a purchased DataArts Studio instance.", + "desc":"The version of a created DataArts Studio instance cannot be directly downgraded.However, you can downgrade the version by creating an instance of an earlier version, migr", "product_code":"dataartsstudio", "title":"Does DataArts Studio Support Version Downgrade?", "uri":"dataartsstudio_03_0087.html", "doc_type":"usermanual", - "p_code":"343", - "code":"349" + "p_code":"350", + "code":"356" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3146,89 +3209,89 @@ "title":"Management Center", "uri":"dataartsstudio_03_0022.html", "doc_type":"usermanual", - "p_code":"342", - "code":"350" + "p_code":"349", + "code":"357" }, { - "desc":"For details about the data connections supported by DataArts Studio, see Data Sources Supported by DataArts Studio.", + "desc":"DataArts Studio can interconnect with cloud services such as GaussDB(DWS), DLI, and MRS Hive as well as traditional databases such as MySQL and . For details, see Data So", "product_code":"dataartsstudio", - "title":"Which Data Connections Are Supported by DataArts Studio?", + "title":"Which Data Sources Can DataArts Studio Connect To?", "uri":"dataartsstudio_03_0008.html", "doc_type":"usermanual", - "p_code":"350", - "code":"351" + "p_code":"357", + "code":"358" }, { - "desc":"When creating a DWS, MRS Hive, RDS, and SparkSQL data connection, you must bind an agent provided by the CDM cluster. Currently, a version of the CDM cluster earlier than", + "desc":"RDS data connections depend on OBS. If OBS is unavailable in the same region as DataArts Studio, RDS data connections are not supported.For host connections, only Linux h", "product_code":"dataartsstudio", "title":"What Are the Precautions for Creating Data Connections?", "uri":"dataartsstudio_03_0009.html", "doc_type":"usermanual", - "p_code":"350", - "code":"352" + "p_code":"357", + "code":"359" }, { "desc":"The possible cause is that the CDM cluster is stopped or a concurrency conflict occurs. You can switch to another agent to temporarily avoid this issue.To resolve this is", "product_code":"dataartsstudio", - "title":"Why Do DWS/Hive/HBase Data Connections Fail to Obtain the Information About Database or Tables?", + "title":"What Should I Do If Database or Table Information Cannot Be Obtained Through a GaussDB(DWS)/Hive/HBase Data Connection?", "uri":"dataartsstudio_03_0016.html", "doc_type":"usermanual", - "p_code":"350", - "code":"353" + "p_code":"357", + "code":"360" }, { - "desc":"Possible causes are as follows:Hive/HBase components were not selected during MRS cluster creation.The network between the CDM cluster and MRS cluster was disconnected wh", + "desc":"Possible causes are as follows:Hive/HBase components were not selected during MRS cluster creation.The enterprise project selected during MRS cluster creation is differen", "product_code":"dataartsstudio", "title":"Why Are MRS Hive/HBase Clusters Not Displayed on the Page for Creating Data Connections?", "uri":"dataartsstudio_03_0017.html", "doc_type":"usermanual", - "p_code":"350", - "code":"354" + "p_code":"357", + "code":"361" }, { - "desc":"The failure may be caused by the rights separation function of the DWS cluster. On the DWS console, click the corresponding cluster, choose Security Settings, and disable", + "desc":"The failure may be caused by the rights separation function of the GaussDB(DWS) cluster.On the DWS console, click the corresponding cluster, choose Security Settings, and", "product_code":"dataartsstudio", - "title":"What Should I Do If the Connection Test Fails When I Enable the SSL Connection During the Creation of a DWS Data Connection?", + "title":"What Should I Do If a GaussDB(DWS) Connection Test Fails When SSL Is Enabled for the Connection?", "uri":"dataartsstudio_03_0054.html", "doc_type":"usermanual", - "p_code":"350", - "code":"355" + "p_code":"357", + "code":"362" }, { - "desc":"Multiple data connections of the same type or different types can be created in the same workspace, but their names must be unique.", + "desc":"Yes, but the name of each connection must be unique.To ensure that you can select the correct data connection in future development, you are advised to name the connectio", "product_code":"dataartsstudio", - "title":"Can I Create Multiple Data Connections in a Workspace in Proxy Mode?", + "title":"Can I Create Multiple Connections to the Same Data Source in a Workspace?", "uri":"dataartsstudio_03_0089.html", "doc_type":"usermanual", - "p_code":"350", - "code":"356" + "p_code":"357", + "code":"363" }, { - "desc":"You are advised to choose a proxy connection.", + "desc":"The API connection type is available only for DataArts Factory.To ensure that a connection is available for other components such as DataArts Architecture, DataArts Quali", "product_code":"dataartsstudio", - "title":"Should I Choose a Direct or a Proxy Connection When Creating a DWS Connection?", + "title":"Should I Select the API or Proxy Connection Type When Creating a Data Connection in Management Center?", "uri":"dataartsstudio_03_0137.html", "doc_type":"usermanual", - "p_code":"350", - "code":"357" + "p_code":"357", + "code":"364" }, { - "desc":"You can export the jobs in DataArts Factory and then import them to DataArts Factory in another workspace.You can export data connections on the Migrate Resources page of", + "desc":"You can export data connections and jobs from one workspace and import them to another workspace.Export and import data connections in Management Center.Export and import", "product_code":"dataartsstudio", "title":"How Do I Migrate the Data Development Jobs and Data Connections from One Workspace to Another?", "uri":"dataartsstudio_03_0153.html", "doc_type":"usermanual", - "p_code":"350", - "code":"358" + "p_code":"357", + "code":"365" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", "product_code":"dataartsstudio", - "title":"DataArts Migration", + "title":"DataArts Migration (CDM Jobs)", "uri":"dataartsstudio_03_0027.html", "doc_type":"usermanual", - "p_code":"342", - "code":"359" + "p_code":"349", + "code":"366" }, { "desc":"CDM is developed based on a distributed computing framework and leverages the parallel data processing technology. Table 1 details the advantages of CDM.", @@ -3236,8 +3299,8 @@ "title":"What Are the Advantages of CDM?", "uri":"dataartsstudio_03_0139.html", "doc_type":"usermanual", - "p_code":"359", - "code":"360" + "p_code":"366", + "code":"367" }, { "desc":"CDM is a fully hosted service that provides the following capabilities to protect user data security:Instance isolation: CDM users can use only their own instances. Insta", @@ -3245,8 +3308,8 @@ "title":"What Are the Security Protection Mechanisms of CDM?", "uri":"dataartsstudio_03_0140.html", "doc_type":"usermanual", - "p_code":"359", - "code":"361" + "p_code":"366", + "code":"368" }, { "desc":"When migrating the data on the public network, use NAT Gateway to share the EIPs with other ECSs in the subnet. In this way, data on the on-premises data center or third-", @@ -3254,8 +3317,8 @@ "title":"How Do I Reduce the Cost of Using CDM?", "uri":"dataartsstudio_03_0099.html", "doc_type":"usermanual", - "p_code":"359", - "code":"362" + "p_code":"366", + "code":"369" }, { "desc":"No. To use a later version cluster, you can create one.", @@ -3263,8 +3326,8 @@ "title":"Can I Upgrade a CDM Cluster?", "uri":"dataartsstudio_03_0302.html", "doc_type":"usermanual", - "p_code":"359", - "code":"363" + "p_code":"366", + "code":"370" }, { "desc":"Theoretically, a cdm.large CDM instance can migrate 1 TB to 8 TB data per day. The actual transmission rate is affected by factors such as the Internet bandwidth, cluster", @@ -3272,8 +3335,8 @@ "title":"How Is the Migration Performance of CDM?", "uri":"dataartsstudio_03_0141.html", "doc_type":"usermanual", - "p_code":"359", - "code":"364" + "p_code":"366", + "code":"371" }, { "desc":"CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submitted, CDM splits each job into multiple tasks based on the ", @@ -3281,17 +3344,17 @@ "title":"What Is the Number of Concurrent Jobs for Different CDM Cluster Versions?", "uri":"dataartsstudio_03_0124.html", "doc_type":"usermanual", - "p_code":"359", - "code":"365" + "p_code":"366", + "code":"372" }, { - "desc":"CDM supports incremental data migration. With scheduled jobs and macro variables of date and time, CDM provides incremental data migration in the following scenarios:Incr", + "desc":"Does CDM support incremental data migration?CDM supports incremental data migration.With scheduled jobs and macro variables of date and time, CDM provides incremental dat", "product_code":"dataartsstudio", "title":"Does CDM Support Incremental Data Migration?", "uri":"dataartsstudio_03_0069.html", "doc_type":"usermanual", - "p_code":"359", - "code":"366" + "p_code":"366", + "code":"373" }, { "desc":"Yes. CDM supports the following field converters:AnonymizationTrimReverse StringReplace StringExpression ConversionYou can create a field converter on the Map Field page ", @@ -3299,8 +3362,8 @@ "title":"Does CDM Support Field Conversion?", "uri":"dataartsstudio_03_0028.html", "doc_type":"usermanual", - "p_code":"359", - "code":"367" + "p_code":"366", + "code":"374" }, { "desc":"The recommended component versions can be used as both the source and destination.", @@ -3308,62 +3371,62 @@ "title":"What Component Versions Are Recommended for Migrating Hadoop Data Sources?", "uri":"dataartsstudio_03_0107.html", "doc_type":"usermanual", - "p_code":"359", - "code":"368" + "p_code":"366", + "code":"375" }, { - "desc":"CDM can read and write data in SequenceFile, TextFile, ORC, or Parquet format from the Hive data source.", + "desc":"Which data formats are supported when the data source is Hive?CDM can read and write data in SequenceFile, TextFile, ORC, or Parquet format from the Hive data source.", "product_code":"dataartsstudio", "title":"What Data Formats Are Supported When the Data Source Is Hive?", "uri":"dataartsstudio_03_0029.html", "doc_type":"usermanual", - "p_code":"359", - "code":"369" + "p_code":"366", + "code":"376" }, { - "desc":"CDM does not support direct job migration across clusters. However, you can use the batch job import and export function to indirectly implement cross-cluster migration a", + "desc":"Can I synchronize jobs to other CDM clusters?CDM does not support direct job migration across clusters. However, you can use the batch job import and export function to i", "product_code":"dataartsstudio", "title":"Can I Synchronize Jobs to Other Clusters?", "uri":"dataartsstudio_03_0030.html", "doc_type":"usermanual", - "p_code":"359", - "code":"370" + "p_code":"366", + "code":"377" }, { - "desc":"CDM supports batch job creation with the help of the batch import function. You can create jobs in batches as follows:Create a job manually.Export the job and save the jo", + "desc":"Can I create CDM jobs in batches?CDM supports batch job creation with the help of the batch import function. You can create jobs in batches as follows:Create a job manual", "product_code":"dataartsstudio", "title":"Can I Create Jobs in Batches?", "uri":"dataartsstudio_03_0031.html", "doc_type":"usermanual", - "p_code":"359", - "code":"371" + "p_code":"366", + "code":"378" }, { - "desc":"Yes.Access the DataArts Factory module of the DataArts Studio service.In the navigation pane of the DataArts Factory homepage, choose Data Development > Develop Job to cr", + "desc":"Can I schedule CDM jobs in batches?Yes.Access the DataArts Factory module of the DataArts Studio service.In the navigation pane of the DataArts Factory homepage, choose D", "product_code":"dataartsstudio", "title":"Can I Schedule Jobs in Batches?", "uri":"dataartsstudio_03_0100.html", "doc_type":"usermanual", - "p_code":"359", - "code":"372" + "p_code":"366", + "code":"379" }, { - "desc":"You can use the batch export function of CDM to save all job scripts to a local PC. Then, you can create a cluster and import the jobs again when necessary.", + "desc":"How do I back up CDM jobs?You can use the batch export function of CDM to save all job scripts to a local PC. Then, you can create a cluster and import the jobs again whe", "product_code":"dataartsstudio", "title":"How Do I Back Up CDM Jobs?", "uri":"dataartsstudio_03_0032.html", "doc_type":"usermanual", - "p_code":"359", - "code":"373" + "p_code":"366", + "code":"380" }, { - "desc":"To ensure that CDM can communicate with the HANA cluster, perform the following operations:Disable Statement Routing of the HANA cluster. Note that this will increase the", + "desc":"What should I do If only some nodes in a HANA cluster can communicate with the CDM cluster?To ensure that CDM can communicate with the HANA cluster, perform the following", "product_code":"dataartsstudio", - "title":"How Do I Configure the Connection If Only Some Nodes in the HANA Cluster Can Communicate with the CDM Cluster?", + "title":"What Should I Do If Only Some Nodes in a HANA Cluster Can Communicate with the CDM Cluster?", "uri":"dataartsstudio_03_0119.html", "doc_type":"usermanual", - "p_code":"359", - "code":"374" + "p_code":"366", + "code":"381" }, { "desc":"CDM provides RESTful APIs to implement automatic job creation or execution control by program invocation.The following describes how to use CDM to migrate data from table", @@ -3371,8 +3434,8 @@ "title":"How Do I Use Java to Invoke CDM RESTful APIs to Create Data Migration Jobs?", "uri":"dataartsstudio_03_0101.html", "doc_type":"usermanual", - "p_code":"359", - "code":"375" + "p_code":"366", + "code":"382" }, { "desc":"Many enterprises deploy key data sources on the intranet, such as databases and file servers. CDM runs on the cloud. To migrate the intranet data to the cloud using CDM, ", @@ -3380,8 +3443,8 @@ "title":"How Do I Connect the On-Premises Intranet or Third-Party Private Network to CDM?", "uri":"dataartsstudio_03_0033.html", "doc_type":"usermanual", - "p_code":"359", - "code":"376" + "p_code":"366", + "code":"383" }, { "desc":"CDM migrates data through data migration jobs. It works in the following way:When data migration jobs are submitted, CDM splits each job into multiple tasks based on the ", @@ -3389,26 +3452,26 @@ "title":"How Do I Set the Number of Concurrent Extractors for a CDM Migration Job?", "uri":"dataartsstudio_03_0336.html", "doc_type":"usermanual", - "p_code":"359", - "code":"377" + "p_code":"366", + "code":"384" }, { - "desc":"No. If data is written to the source during the migration, an error may occur.", + "desc":"Does CDM support real-time migration of dynamic data?No.If data is written to the source during the migration, an error may occur.", "product_code":"dataartsstudio", "title":"Does CDM Support Real-Time Migration of Dynamic Data?", "uri":"dataartsstudio_03_0337.html", "doc_type":"usermanual", - "p_code":"359", - "code":"378" + "p_code":"366", + "code":"385" }, { - "desc":"You can use the DateUtils.format(${timestamp()},\"yyyy-MM-dd HH:mm:ss\") expression on the Map Field page to obtain the current time.", + "desc":"How do I obtain the current time using an expression?You can use the DateUtils.format(${timestamp()},\"yyyy-MM-dd HH:mm:ss\") expression on the Map Field page to obtain the", "product_code":"dataartsstudio", "title":"How Do I Obtain the Current Time Using an Expression?", "uri":"dataartsstudio_03_0340.html", "doc_type":"usermanual", - "p_code":"359", - "code":"379" + "p_code":"366", + "code":"386" }, { "desc":"When CDM is used to import data from OBS to SQL Server, the job fails to be executed and error message \"Unable to execute the SQL statement. Cause: \"String or binary data", @@ -3416,8 +3479,8 @@ "title":"What Can I Do If Error Message \"Unable to execute the SQL statement\" Is Displayed When I Import Data from OBS to SQL Server?", "uri":"dataartsstudio_03_0106.html", "doc_type":"usermanual", - "p_code":"359", - "code":"380" + "p_code":"366", + "code":"387" }, { "desc":"When CDM is used to migrate Oracle data to DWS, an error is reported, as shown in Figure 1.During data migration, if the entire table is queried and the table contains a ", @@ -3425,26 +3488,26 @@ "title":"Why Is Error ORA-01555 Reported During Migration from Oracle to DWS?", "uri":"dataartsstudio_03_0071.html", "doc_type":"usermanual", - "p_code":"359", - "code":"381" + "p_code":"366", + "code":"388" }, { - "desc":"By default, the userAdmin role has only the permissions to manage roles and users and does not have the read and write permissions on a database.If the MongoDB connection", + "desc":"Migration using a MongoDB connection fails.By default, the userAdmin role has only the permissions to manage roles and users and does not have the read and write permissi", "product_code":"dataartsstudio", - "title":"What Should I Do If the MongoDB Connection Migration Fails?", + "title":"What Should I Do If Migration Using a MongoDB Connection Fails?", "uri":"dataartsstudio_03_0072.html", "doc_type":"usermanual", - "p_code":"359", - "code":"382" + "p_code":"366", + "code":"389" }, { - "desc":"Manually stop the Hive migration job and add the following attribute settings to the Hive data connection:Attribute Name: hive.server2.idle.operation.timeoutValue: 10mIn ", + "desc":"What should I do If a Hive migration job is suspended for a long period of time?Manually stop the Hive migration job and add the following attribute settings to the Hive ", "product_code":"dataartsstudio", "title":"What Should I Do If a Hive Migration Job Is Suspended for a Long Period of Time?", "uri":"dataartsstudio_03_0093.html", "doc_type":"usermanual", - "p_code":"359", - "code":"383" + "p_code":"366", + "code":"390" }, { "desc":"When you use CDM to migrate data to DWS, the migration job fails and the error message \"value too long for type character varying\" is displayed in the execution log.The p", @@ -3452,44 +3515,44 @@ "title":"What Should I Do If an Error Is Reported Because the Field Type Mapping Does Not Match During Data Migration Using CDM?", "uri":"dataartsstudio_03_0109.html", "doc_type":"usermanual", - "p_code":"359", - "code":"384" + "p_code":"366", + "code":"391" }, { - "desc":"The following error message is displayed during MySQL migration: \"Unable to connect to the database server. Cause: connect timed out.\"The table has a large data volume, a", + "desc":"The following error message is displayed during MySQL migration: \"Unable to connect to the database server. Cause: connect timed out\"The table has a large data volume, an", "product_code":"dataartsstudio", "title":"What Should I Do If a JDBC Connection Timeout Error Is Reported During MySQL Migration?", "uri":"dataartsstudio_03_0110.html", "doc_type":"usermanual", - "p_code":"359", - "code":"385" + "p_code":"366", + "code":"392" }, { - "desc":"You are advised to clear historical data and try again. In addition, when creating a migration job, you are advised to enable the system to clear historical data. This gr", + "desc":"A CDM migration job fails after a link from Hive to GaussDB(DWS) is created.You are advised to clear historical data and try again. In addition, when creating a migration", "product_code":"dataartsstudio", - "title":"What Should I Do If a CDM Migration Job Fails After a Link from Hive to DWS Is Created?", + "title":"What Should I Do If a CDM Migration Job Fails After a Link from Hive to GaussDB(DWS) Is Created?", "uri":"dataartsstudio_03_0121.html", "doc_type":"usermanual", - "p_code":"359", - "code":"386" + "p_code":"366", + "code":"393" }, { - "desc":"CDM does not support this operation. You are advised to manually export a MySQL data file, enable the SFTP service on the server, and create a CDM job with SFTP as the so", + "desc":"How do I use CDM to export MySQL data to an SQL file and upload the file to an OBS bucket?CDM does not support this operation. You are advised to manually export a MySQL ", "product_code":"dataartsstudio", "title":"How Do I Use CDM to Export MySQL Data to an SQL File and Upload the File to an OBS Bucket?", "uri":"dataartsstudio_03_0122.html", "doc_type":"usermanual", - "p_code":"359", - "code":"387" + "p_code":"366", + "code":"394" }, { - "desc":"Dirty data writing is configured, but no dirty data exists. You need to decrease the number of concurrent tasks to avoid this issue.", + "desc":"CDM fails to migrate data from OBS to DLI.Dirty data writing is configured, but no dirty data exists. You need to decrease the number of concurrent tasks to avoid this is", "product_code":"dataartsstudio", "title":"What Should I Do If CDM Fails to Migrate Data from OBS to DLI?", "uri":"dataartsstudio_03_0123.html", "doc_type":"usermanual", - "p_code":"359", - "code":"388" + "p_code":"366", + "code":"395" }, { "desc":"This error is reported because the customer's certificate has expired. Update the certificate and reconfigure the connector.", @@ -3497,44 +3560,44 @@ "title":"What Should I Do If a CDM Connector Reports the Error \"Configuration Item [linkConfig.iamAuth] Does Not Exist\"?", "uri":"dataartsstudio_03_0132.html", "doc_type":"usermanual", - "p_code":"359", - "code":"389" + "p_code":"366", + "code":"396" }, { - "desc":"If you create a link or save a job in a CDM cluster of an earlier version, and then access a CDM cluster of a later version, this error occurs occasionally.Manually clear", + "desc":"Error message \"Configuration Item [linkConfig.createBackendLinks] Does Not Exist\" or \"Configuration Item [throttlingConfig.concurrentSubJobs] Does Not Exist\" is displayed", "product_code":"dataartsstudio", "title":"What Should I Do If Error \"Configuration Item [linkConfig.createBackendLinks] Does Not Exist\" or \"Configuration Item [throttlingConfig.concurrentSubJobs] Does Not Exist\" Is Reported?", "uri":"dataartsstudio_03_0333.html", "doc_type":"usermanual", - "p_code":"359", - "code":"390" + "p_code":"366", + "code":"397" }, { - "desc":"This failure occurs because you do not have the required permissions. Create another service user, grant the required permissions to it, and try again.To create a data co", + "desc":"Message \"CORE_0031:Connect time out. (Cdm.0523)\" is displayed during the creation of an MRS Hive link.If a message is displayed indicating that the configuration file can", "product_code":"dataartsstudio", "title":"What Should I Do If Message \"CORE_0031:Connect time out. (Cdm.0523)\" Is Displayed During the Creation of an MRS Hive Link?", "uri":"dataartsstudio_03_0166.html", "doc_type":"usermanual", - "p_code":"359", - "code":"391" + "p_code":"366", + "code":"398" }, { - "desc":"The cause is that the database table name contains special characters, resulting in incorrect syntax. You can resolve this issue by renaming the database table according ", + "desc":"Message \"CDM Does Not Support Auto Creation of an Empty Table with No Column\" is displayed when I enable auto table creation.The cause is that the database table name con", "product_code":"dataartsstudio", "title":"What Should I Do If Message \"CDM Does Not Support Auto Creation of an Empty Table with No Column\" Is Displayed When I Enable Auto Table Creation?", "uri":"dataartsstudio_03_0167.html", "doc_type":"usermanual", - "p_code":"359", - "code":"392" + "p_code":"366", + "code":"399" }, { - "desc":"This may be because you have uploaded the latest ORACLE_8 driver (for example, Oracle Database 21c (21.3) driver), which is not supported yet. You are advised to use the ", + "desc":"I cannot obtain the schema name when creating an Oracle relational database migration job.The latest ORACLE_8 driver, which is not supported, may have been uploaded, for ", "product_code":"dataartsstudio", "title":"What Should I Do If I Cannot Obtain the Schema Name When Creating an Oracle Relational Database Migration Job?", "uri":"dataartsstudio_03_0334.html", "doc_type":"usermanual", - "p_code":"359", - "code":"393" + "p_code":"366", + "code":"400" }, { "desc":"The MySQL database stores values 0 and 1, rather than true and false. However, true or false is read during MySQL database migration, and the following error information ", @@ -3542,8 +3605,8 @@ "title":"What Should I Do If invalid input syntax for integer: \"true\" Is Displayed During MySQL Database Migration?", "uri":"dataartsstudio_03_0341.html", "doc_type":"usermanual", - "p_code":"359", - "code":"394" + "p_code":"366", + "code":"401" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3551,152 +3614,152 @@ "title":"DataArts Factory", "uri":"dataartsstudio_03_0035.html", "doc_type":"usermanual", - "p_code":"342", - "code":"395" + "p_code":"349", + "code":"402" }, { - "desc":"By default, each user can create a maximum of 10,000 jobs, and each job can contain a maximum of 200 nodes.", + "desc":"Whether the number of jobs and the number of nodes in a job are limited during data developmentBy default, each user can create a maximum of 10,000 jobs, and each job can", "product_code":"dataartsstudio", "title":"How Many Jobs Can Be Created in DataArts Factory? Is There a Limit on the Number of Nodes in a Job?", "uri":"dataartsstudio_03_0036.html", "doc_type":"usermanual", - "p_code":"395", - "code":"396" + "p_code":"402", + "code":"403" }, { - "desc":"Yes.", + "desc":"Whether DataArts Studio supports custom Python scriptsYes.", "product_code":"dataartsstudio", "title":"Does DataArts Studio Support Custom Python Scripts?", "uri":"dataartsstudio_03_0126.html", "doc_type":"usermanual", - "p_code":"395", - "code":"397" + "p_code":"402", + "code":"404" }, { - "desc":"On the Running History page, there is a large difference between Job Execution Time and Start Time, as shown in the figure below. Job Execution Time is the time when the ", + "desc":"On the Running History page, there is a large difference between Job Execution Time and Start Time. Job Execution Time is the time when the job is expected to be executed", "product_code":"dataartsstudio", "title":"Why Is There a Large Difference Between Job Execution Time and Start Time of a Job?", "uri":"dataartsstudio_03_0041.html", "doc_type":"usermanual", - "p_code":"395", - "code":"398" + "p_code":"402", + "code":"405" }, { - "desc":"The subsequent jobs may be suspended, continued, or canceled, depending on the configuration.In this case, do not stop the job. You can rerun the failed job instance or s", + "desc":"One of the jobs that depend on each other fails during scheduling.The subsequent jobs may be suspended, continued, or canceled, depending on the configuration.In this cas", "product_code":"dataartsstudio", "title":"Will Subsequent Jobs Be Affected If a Job Fails to Be Executed During Scheduling of Dependent Jobs? What Should I Do?", "uri":"dataartsstudio_03_0042.html", "doc_type":"usermanual", - "p_code":"395", - "code":"399" + "p_code":"402", + "code":"406" }, { - "desc":"Lock management is unavailable for DLI and MRS. Therefore, if you perform read and write operations on the tables simultaneously, data conflict will occur and the operati", + "desc":"Notes for scheduling big data services using DataArts StudioLock management is unavailable for DLI and MRS. Therefore, if you perform read and write operations on the tab", "product_code":"dataartsstudio", "title":"What Should I Pay Attention to When Using DataArts Studio to Schedule Big Data Services?", "uri":"dataartsstudio_03_0149.html", "doc_type":"usermanual", - "p_code":"395", - "code":"400" + "p_code":"402", + "code":"407" }, { - "desc":"Parameters can be set in environment variables, job parameters, and script parameters, but their application scopes are different. If there is a conflict when parameters ", + "desc":"Differences and relationships between environment variables, job parameters, and script parametersThe application scopes of workspace environment variables, job parameter", "product_code":"dataartsstudio", - "title":"What Are the Differences and Connections Among Environment Variables, Job Parameters, and Script Parameters?", + "title":"What Are the Differences and Relationships Between Environment Variables, Job Parameters, and Script Parameters?", "uri":"dataartsstudio_03_0136.html", "doc_type":"usermanual", - "p_code":"395", - "code":"401" + "p_code":"402", + "code":"408" }, { - "desc":"Job logs are stored in OBS buckets. You must configure the bucket directory for storing job logs in the workspace and check whether the your account has the OBS read perm", + "desc":"You do not have the required permissions.Job logs are stored in OBS buckets. You must configure the bucket directory for storing job logs in the workspace and check wheth", "product_code":"dataartsstudio", - "title":"What Should I Do If Job Logs Cannot Be Opened and Error 404 Is Reported?", + "title":"What Should I Do If a Job Log Cannot Be Opened and Error 404 Is Reported?", "uri":"dataartsstudio_03_0050.html", "doc_type":"usermanual", - "p_code":"395", - "code":"402" + "p_code":"402", + "code":"409" }, { - "desc":"When a workspace- or job-level agency is configured, the following error is reported when the agency list is viewed:Policy doesn't allow iam:agencies:listAgencies to be p", + "desc":"If error message \"Policy doesn't allow iam:agencies:listAgencies to be performed.\" is displayed when you are creating a workspace-level or job-level agency, you may lack ", "product_code":"dataartsstudio", "title":"What Should I Do If the Agency List Fails to Be Obtained During Agency Configuration?", "uri":"dataartsstudio_03_0051.html", "doc_type":"usermanual", - "p_code":"395", - "code":"403" + "p_code":"402", + "code":"410" }, { - "desc":"Ensure that the current instance and peripheral resources are in the same region and IAM project. If the enterprise project function is enabled for your account, the curr", + "desc":"The specified peripheral resources may not be in the same region as the instance.Ensure that the current DataArts Studio instance and peripheral resources are in the same", "product_code":"dataartsstudio", - "title":"Why Cannot Specified Peripheral Resources Be Selected When a Data Connection Is Created in Data Development?", + "title":"Why Can't I Select Specified Peripheral Resources When Creating a Data Connection in DataArts Factory?", "uri":"dataartsstudio_03_0056.html", "doc_type":"usermanual", - "p_code":"395", - "code":"404" + "p_code":"402", + "code":"411" }, { - "desc":"On the Data Development page, choose MonitoringMonitor Job to check whether the target job is being scheduled. A job can be scheduled only within the scheduling period.Vi", + "desc":"Why Is There No Job Running Scheduling Log on the Monitor Instance Page After Periodic Scheduling Is Configured for a Job? This job has not been started or the job on whi", "product_code":"dataartsstudio", "title":"Why Is There No Job Running Scheduling Log on the Monitor Instance Page After Periodic Scheduling Is Configured for a Job?", "uri":"dataartsstudio_03_0058.html", "doc_type":"usermanual", - "p_code":"395", - "code":"405" + "p_code":"402", + "code":"412" }, { - "desc":"Check whether the data connection used by the Hive SQL and Spark SQL scripts is direct connection or proxy connection.In direct connection mode, DataArts Studio users sub", + "desc":"This issue may be caused by the connection mode.Check whether the data connection used by the Hive SQL and Spark SQL scripts is an MRS API connection or proxy connection.", "product_code":"dataartsstudio", - "title":"Why does the GUI display only the failure result but not the specific error cause after Hive SQL and Spark SQL scripts fail to be executed?", + "title":"Why Isn't the Error Cause Displayed on the Console When a Hive SQL or Spark SQL Scripts Fails?", "uri":"dataartsstudio_03_0059.html", "doc_type":"usermanual", - "p_code":"395", - "code":"406" + "p_code":"402", + "code":"413" }, { - "desc":"Check whether the permissions of the current user in IAM are changed, whether the user is removed from the user group, or whether the permission policy of the user group ", + "desc":"During the execution of a data development node, a message is displayed indicating that the token is invalid.Check whether the permissions of the current user in IAM are ", "product_code":"dataartsstudio", - "title":"What Do I Do If the Token Is Invalid During the Running of a Data Development Node?", + "title":"What Should I Do If the Token Is Invalid During the Execution of a Data Development Node?", "uri":"dataartsstudio_03_0060.html", "doc_type":"usermanual", - "p_code":"395", - "code":"407" + "p_code":"402", + "code":"414" }, { - "desc":"Method 1: After the node test is complete, right-click the current node and choose View Log from the shortcut menu.Method 2: Click Monitorin the upper part of the canvas,", + "desc":"How to view run logs after testing a jobMethod 1: After the node test is complete, right-click the current node and choose View Log from the shortcut menu.Method 2: Click", "product_code":"dataartsstudio", "title":"How Do I View Run Logs After a Job Is Tested?", "uri":"dataartsstudio_03_0062.html", "doc_type":"usermanual", - "p_code":"395", - "code":"408" + "p_code":"402", + "code":"415" }, { - "desc":"Jobs scheduled by month depend on jobs scheduled by day. Why does a job scheduled by month start running before the job scheduled by day is complete?Although jobs schedul", + "desc":"The monthly job depends on daily jobs of the previous month rather than the current month.Jobs scheduled by month depend on jobs scheduled by day. Why does a job schedule", "product_code":"dataartsstudio", "title":"Why Does a Job Scheduled by Month Start Running Before the Job Scheduled by Day Is Complete?", "uri":"dataartsstudio_03_0063.html", "doc_type":"usermanual", - "p_code":"395", - "code":"409" + "p_code":"402", + "code":"416" }, { - "desc":"Check whether the current user has the DLI Service User or DLI Service Admin permissions in IAM.", + "desc":"This issue may be caused by insufficient permissions.Check whether the current user has the DLI Service User or DLI Service Admin permissions in IAM.", "product_code":"dataartsstudio", "title":"What Should I Do If Invalid Authentication Is Reported When I Run a DLI Script?", "uri":"dataartsstudio_03_0065.html", "doc_type":"usermanual", - "p_code":"395", - "code":"410" + "p_code":"402", + "code":"417" }, { - "desc":"Check whether the CDM cluster is stopped. If it is stopped, restart it.", + "desc":"The CDM cluster may be stopped.Check whether the CDM cluster is stopped. If it is stopped, restart it.", "product_code":"dataartsstudio", - "title":"Why Cannot I Select the Desired CDM Cluster in Proxy Mode When Creating a Data Connection?", + "title":"Why Cannot I Select a Desired CDM Cluster in Proxy Mode When Creating a Data Connection?", "uri":"dataartsstudio_03_0066.html", "doc_type":"usermanual", - "p_code":"395", - "code":"411" + "p_code":"402", + "code":"418" }, { "desc":"Daily scheduling is configured for the job, but there is no job scheduling record in the instance.Cause 1: Check whether the job scheduling is started. If not, the job wi", @@ -3704,8 +3767,8 @@ "title":"Why Is There No Job Running Scheduling Record After Daily Scheduling Is Configured for the Job?", "uri":"dataartsstudio_03_0111.html", "doc_type":"usermanual", - "p_code":"395", - "code":"412" + "p_code":"402", + "code":"419" }, { "desc":"There is no content contained in the job log.If the bucket directory for storing job logs has been configured in the workspace, check whether you have the global permissi", @@ -3713,8 +3776,8 @@ "title":"What Do I Do If No Content Is Displayed in Job Logs?", "uri":"dataartsstudio_03_0112.html", "doc_type":"usermanual", - "p_code":"395", - "code":"413" + "p_code":"402", + "code":"420" }, { "desc":"Two jobs are created, but the dependency relationship cannot be established.Check whether the two jobs' recurrence are both every week or every month. Currently, if the t", @@ -3722,26 +3785,26 @@ "title":"Why Do I Fail to Establish a Dependency Between Two Jobs?", "uri":"dataartsstudio_03_0113.html", "doc_type":"usermanual", - "p_code":"395", - "code":"414" + "p_code":"402", + "code":"421" }, { - "desc":"An error is reported when DataArts Studio executes scheduling: The job does not have a submitted version. Submit the job version first.Job scheduling process begins befor", + "desc":"An error is reported during job scheduling in DataArts Studio, indicating that the job has not been submitted.Job scheduling process begins before the version is submitte", "product_code":"dataartsstudio", - "title":"What Should I Do If an Error Is Displayed During DataArts Studio Scheduling: The Job Does Not Have a Submitted Version?", + "title":"What Should I Do If an Error Is Reported During Job Scheduling in DataArts Studio, Indicating that the Job Has Not Been Submitted?", "uri":"dataartsstudio_03_0114.html", "doc_type":"usermanual", - "p_code":"395", - "code":"415" + "p_code":"402", + "code":"422" }, { "desc":"An error is reported when DataArts Studio executes scheduling: The script associated with node XXX in the job is not submitted.Job scheduling process begins before the sc", "product_code":"dataartsstudio", - "title":"What Do I Do If an Error Is Displayed During DataArts Studio Scheduling: The Script Associated with Node XXX in the Job Is Not Submitted?", + "title":"What Should I Do If an Error Is Reported During Job Scheduling in DataArts Studio, Indicating that the Script Associated with Node XXX in the Job Has Not Been Submitted?", "uri":"dataartsstudio_03_0115.html", "doc_type":"usermanual", - "p_code":"395", - "code":"416" + "p_code":"402", + "code":"423" }, { "desc":"After a job is submitted for scheduling, the job fails to be executed and the following error is displayed \"depend job [XXX] is not running or pause\".The upstream depende", @@ -3749,71 +3812,71 @@ "title":"What Should I Do If a Job Fails to Be Executed After Being Submitted for Scheduling and an Error Displayed: Depend Job [XXX] Is Not Running Or Pause?", "uri":"dataartsstudio_03_0116.html", "doc_type":"usermanual", - "p_code":"395", - "code":"417" + "p_code":"402", + "code":"424" }, { - "desc":"Databases and data tables can be created in DLI.A database does not correspond to a data connection. A data connection is a connection channel for creating DataArts Studi", + "desc":"This section describes how to create databases and data tables, and the relationship between databases and data connections.You can create databases and data tables in Da", "product_code":"dataartsstudio", - "title":"How Do I Create a Database And Data Table? Is the database a data connection?", + "title":"How Do I Create Databases and Data Tables? Do Databases Correspond to Data Connections?", "uri":"dataartsstudio_03_0127.html", "doc_type":"usermanual", - "p_code":"395", - "code":"418" + "p_code":"402", + "code":"425" }, { - "desc":"Solution: Clear the cache data and use the direct connection to display the data.", + "desc":"The connection mode may be incorrect.Clear the cache data and use the direct connection to display the data.", "product_code":"dataartsstudio", - "title":"Why Is No Result Displayed After an HIVE Task Is Executed?", + "title":"Why Is No Result Displayed After a Hive Task Is Executed?", "uri":"dataartsstudio_03_0129.html", "doc_type":"usermanual", - "p_code":"395", - "code":"419" + "p_code":"402", + "code":"426" }, { - "desc":"The last instance status indicates a job has been executed, and the status can only be successful or failed. The Monitor Instance page displays all statuses of the job, i", + "desc":"The Last Instance Status on the Monitor Instance page is either successful or failed.The last instance status indicates a job has been executed, and the status can only b", "product_code":"dataartsstudio", - "title":"Why Does the Last Instance Status On the Monitor Instance page Only Display Succeeded or Failed?", + "title":"Why Is the Last Instance Status On the Monitor Instance Page Either Successful or Failed?", "uri":"dataartsstudio_03_0135.html", "doc_type":"usermanual", - "p_code":"395", - "code":"420" + "p_code":"402", + "code":"427" }, { - "desc":"Choose Monitoring > Monitor Job and click the Batch Job Monitoring tab.Select the jobs to be configured and click Configure Notification.Creating a notificationSet notifi", + "desc":"How to configure notifications for all jobsOn the DataArts Studio console, locate a workspace and click DataArts Factory.In the navigation pane on the left, choose Monito", "product_code":"dataartsstudio", - "title":"How Do I Create a Notification for All Jobs?", + "title":"How Do I Configure Notifications for All Jobs?", "uri":"dataartsstudio_03_0148.html", "doc_type":"usermanual", - "p_code":"395", - "code":"421" + "p_code":"402", + "code":"428" }, { - "desc":"Currently, the time zone of a DataArts Studio instance cannot be changed.During the scheduling of data development jobs, an EL expression can be used to adapt to the loca", + "desc":"Whether the time zone of a DataArts Studio instance can be changed. If not, how can the time of a DataArts Studio instance be adapted to the local time.Currently, the tim", "product_code":"dataartsstudio", "title":"Can I Change the Time Zone of a DataArts Studio Instance?", "uri":"dataartsstudio_03_0193.html", "doc_type":"usermanual", - "p_code":"395", - "code":"422" + "p_code":"402", + "code":"429" }, { - "desc":"After renaming a CDM job, you need to select the renamed CDM job in the CDM node attributes on the DataArts Factory console.", + "desc":"Updated names of CDM jobs cannot be synchronized to DataArts Factory.After renaming a CDM job, you need to select the renamed CDM job in the CDM node attributes on the Da", "product_code":"dataartsstudio", "title":"How Do I Synchronize the Changed Names of CDM Jobs to DataArts Factory?", "uri":"dataartsstudio_03_0194.html", "doc_type":"usermanual", - "p_code":"395", - "code":"423" + "p_code":"402", + "code":"430" }, { - "desc":"By default, the hll plug-in is created in the public schema. The SQL statement must contain the schema to which the hll belongs.", + "desc":"An RDS SQL statement fails to be executed and an error is reported indicating that hll does not exist.By default, the hll plug-in is created in the public schema. The SQL", "product_code":"dataartsstudio", "title":"Why Does the Execution of an RDS SQL Statement Fail and an Error Is Reported Indicating That hll Does Not Exist?", "uri":"dataartsstudio_03_0400.html", "doc_type":"usermanual", - "p_code":"395", - "code":"424" + "p_code":"402", + "code":"431" }, { "desc":"If the number of incorrect password attempts for connecting to the DWS cluster reaches the value of failed_login_attempts (10 by default), the account is automatically lo", @@ -3821,98 +3884,98 @@ "title":"What Should I Do If Error Message \"The account has been locked\" Is Displayed When I Am Creating a DWS Data Connection?", "uri":"dataartsstudio_03_0402.html", "doc_type":"usermanual", - "p_code":"395", - "code":"425" + "p_code":"402", + "code":"432" }, { - "desc":"Some jobs on which this job instance depends failed. You can click the question mark (?) on the right of the instance status to view the failed jobs.", + "desc":"A job instance is canceled and message \"The node start execute failed, so the current node status is set to cancel.\" is displayed.Some jobs on which this job depends fail", "product_code":"dataartsstudio", - "title":"Why Is a Job Instance Canceled and Message \"The node start execute failed, so the current node status is set to cancel.\" Displayed?", + "title":"What Should I Do If a Job Instance Is Canceled and Message \"The node start execute failed, so the current node status is set to cancel.\" Is Displayed?", "uri":"dataartsstudio_03_0403.html", "doc_type":"usermanual", - "p_code":"395", - "code":"426" + "p_code":"402", + "code":"433" }, { - "desc":"Add the project ID to the request header in the code, that is, header.add(\"X-Project-Id\",Project ID).", + "desc":"Error message \"Workspace does not exists\" is displayed when I call a DataArts Factory API.Add the project ID to the request header in the code, that is, header.add(\"X-Pro", "product_code":"dataartsstudio", "title":"What Should I Do If Error Message \"Workspace does not exists\" Is Displayed When I Call a DataArts Factory API?", "uri":"dataartsstudio_03_0404.html", "doc_type":"usermanual", - "p_code":"395", - "code":"427" + "p_code":"402", + "code":"434" }, { - "desc":"The connector (&) for URL parameters must be escaped.", + "desc":"The URL parameters for calling an API take effect in the test environment when the API can be called properly using Postman.Escape the connector (&) for URL parameters.", "product_code":"dataartsstudio", "title":"Why Don't the URL Parameters for Calling an API Take Effect in the Test Environment When the API Can Be Called Properly Using Postman?", "uri":"dataartsstudio_03_0405.html", "doc_type":"usermanual", - "p_code":"395", - "code":"428" + "p_code":"402", + "code":"435" }, { - "desc":"Use a CDM cluster of version 2.8.6 or a later version when creating a host connection.", + "desc":"The version of the CDM cluster selected during host connection creation may be too early.Use a CDM cluster of version 2.8.6 or a later version when creating a host connec", "product_code":"dataartsstudio", "title":"What Should I Do If Error Message \"Agent need to be updated?\" Is Displayed When I Run a Python Script?", "uri":"dataartsstudio_03_0406.html", "doc_type":"usermanual", - "p_code":"395", - "code":"429" + "p_code":"402", + "code":"436" }, { - "desc":"The Succeed operation was performed on the node, which changed the job instance (and node) status to successful.", + "desc":"An execution failure is displayed for a node whose status is successful.The Succeed operation was performed on the node, which changed the job instance (and node) status ", "product_code":"dataartsstudio", "title":"Why Is an Execution Failure Displayed for a Node in the Log When the Node Status Is Successful?", "uri":"dataartsstudio_03_0407.html", "doc_type":"usermanual", - "p_code":"395", - "code":"430" + "p_code":"402", + "code":"437" }, { - "desc":"DataArts Studio is a project-level service. Choose a project-level token.", + "desc":"An unknown exception occurs when I call a DataArts Factory API.DataArts Studio is a project-level service. Choose a project-level token.", "product_code":"dataartsstudio", "title":"What Should I Do If an Unknown Exception Occurs When I Call a DataArts Factory API?", "uri":"dataartsstudio_03_0408.html", "doc_type":"usermanual", - "p_code":"395", - "code":"431" + "p_code":"402", + "code":"438" }, { - "desc":"The resource name can contain a maximum of 32 characters, including only letters, digits, underscores (_), and hyphens (-).", + "desc":"An error message indicating an invalid resource name is displayed when I call a resource creation API?The resource name can contain a maximum of 32 characters, including ", "product_code":"dataartsstudio", "title":"Why Is an Error Message Indicating an Invalid Resource Name Is Displayed When I Call a Resource Creation API?", "uri":"dataartsstudio_03_0409.html", "doc_type":"usermanual", - "p_code":"395", - "code":"432" + "p_code":"402", + "code":"439" }, { - "desc":"The PatchData task may contain jobs in other workspaces. You can check the statuses of the job instance of the PatchData task in other workspaces.", + "desc":"A PatchData task fails when all PatchData job instances are successful.The PatchData task may contain jobs in other workspaces. You can check the statuses of the job inst", "product_code":"dataartsstudio", "title":"Why Does a PatchData Task Fail When All PatchData Job Instances Are Successful?", "uri":"dataartsstudio_03_0410.html", "doc_type":"usermanual", - "p_code":"395", - "code":"433" + "p_code":"402", + "code":"440" }, { - "desc":"The table already exists, but you do not have permissions to view and edit it.", + "desc":"Role permissions are insufficient.The table already exists, but you do not have permissions to view and edit it.", "product_code":"dataartsstudio", "title":"Why Is a Table Unavailable When an Error Message Indicating that the Table Already Exists Is Displayed During Table Creation from a DWS Data Connection?", "uri":"dataartsstudio_03_0411.html", "doc_type":"usermanual", - "p_code":"395", - "code":"434" + "p_code":"402", + "code":"441" }, { - "desc":"The following figure shows the error.MRS APIs can be called by a single user for a maximum of 60 times per minute. Therefore, the solution is to call the API less frequen", + "desc":"Error message \"The throttling threshold has been reached: policy user over ratelimit,limit:60,time:1 minute\" is displayed when I schedule an MRS Spark job.MRS APIs can be", "product_code":"dataartsstudio", "title":"What Should I Do If Error Message \"The throttling threshold has been reached: policy user over ratelimit,limit:60,time:1 minute.\" Is Displayed When I Schedule an MRS Spark Job?", "uri":"dataartsstudio_03_0415.html", "doc_type":"usermanual", - "p_code":"395", - "code":"435" + "p_code":"402", + "code":"442" }, { "desc":"This error occurs when json.dumps(json_data, ensure_ascii=False) is configured in the Python script. The following figure shows the error.By default, DataArts Studio uses", @@ -3920,8 +3983,8 @@ "title":"What Should I Do If Error Message \"UnicodeEncodeError: 'ascii' codec can't encode characters in position 63-64: ordinal not in range(128)\" Is Displayed When I Run a Python Script?", "uri":"dataartsstudio_03_0417.html", "doc_type":"usermanual", - "p_code":"395", - "code":"436" + "p_code":"402", + "code":"443" }, { "desc":"When you view the logs of a data development node, the error message shown in the following figure is displayed.Logs of data development jobs are stored in OBS buckets. T", @@ -3929,8 +3992,8 @@ "title":"What Should I Do If an Error Message Is Displayed When I View Logs?", "uri":"dataartsstudio_03_0418.html", "doc_type":"usermanual", - "p_code":"395", - "code":"437" + "p_code":"402", + "code":"444" }, { "desc":"This section uses the Shell node as an example.The Shell node fails to be executed, but the Shell script is executed successfully.Obtain the run logs of the Shell node.[2", @@ -3938,8 +4001,8 @@ "title":"What Should I Do If a Shell/Python Node Fails and Error \"session is down\" Is Reported?", "uri":"dataartsstudio_03_0618.html", "doc_type":"usermanual", - "p_code":"395", - "code":"438" + "p_code":"402", + "code":"445" }, { "desc":"The Rest Client operator is used as an example.When configuring a parameter for a job operator, you need to enter the parameter name and value. If you already enter 512 c", @@ -3947,35 +4010,62 @@ "title":"What Should I Do If a Parameter Value in a Request Header Contains More Than 512 Characters?", "uri":"dataartsstudio_03_0619.html", "doc_type":"usermanual", - "p_code":"395", - "code":"439" + "p_code":"402", + "code":"446" }, { - "desc":"This issue is caused by the case of id.During the execution of a DWS SQL script, the system uses lowercase letters by default. If a field is in upper case, add \"\".Example", + "desc":"This issue is caused by the case of the ID.During the execution of a DWS SQL script, the system uses lowercase letters by default. If a field is in upper case, add \"\".Exa", "product_code":"dataartsstudio", "title":"What Should I Do If a Message Is Displayed Indicating that the ID Does Not Exist During the Execution of a DWS SQL Script?", "uri":"dataartsstudio_03_0620.html", "doc_type":"usermanual", - "p_code":"395", - "code":"440" + "p_code":"402", + "code":"447" }, { - "desc":"In the left navigation pane of DataArts Factory, choose MonitoringJob Monitoring.Click the Batch Job Monitoring tab.Query the scheduling and execution of the CDM job by f", + "desc":"Jobs that invoke a CDM jobIn the left navigation pane of DataArts Factory, choose MonitoringJob Monitoring.Click the Batch Job Monitoring tab.Query the scheduling and exe", "product_code":"dataartsstudio", "title":"How Do I Check Which Jobs Invoke a CDM Job?", "uri":"dataartsstudio_03_0621.html", "doc_type":"usermanual", - "p_code":"395", - "code":"441" + "p_code":"402", + "code":"448" }, { - "desc":"Symptom:Error message \"The request parameter invalid\" is displayed when Python is used to call the API for executing scripts.Call the script execution API by following th", + "desc":"Error message \"The request parameter invalid\" is displayed when Python is used to call the API for executing scripts.Call the script execution API by following the instru", "product_code":"dataartsstudio", "title":"What Should I Do If Error Message \"The request parameter invalid\" Is Displayed When I Use Python to Call the API for Executing Scripts?", "uri":"dataartsstudio_03_0623.html", "doc_type":"usermanual", - "p_code":"395", - "code":"442" + "p_code":"402", + "code":"449" + }, + { + "desc":"The default queue of a new DLI SQL script has been deleted.When a DLI SQL script is used or opened, the queue selected for the script is stored in the cache. This queue i", + "product_code":"dataartsstudio", + "title":"What Should I Do If the Default Queue of a New DLI SQL Script in DataArts Factory Has Been Deleted?", + "uri":"dataartsstudio_03_0628.html", + "doc_type":"usermanual", + "p_code":"402", + "code":"450" + }, + { + "desc":"During the configuration of a job in DataArts Factory, offline Kafka cannot be selected when Scheduling Type is set to Event-based and Event Type is set to KAFKA.Only MRS", + "product_code":"dataartsstudio", + "title":"Does the Event-based Scheduling Type in DataArts Factory Support Offline Kafka?", + "uri":"dataartsstudio_03_0629.html", + "doc_type":"usermanual", + "p_code":"402", + "code":"451" + }, + { + "desc":"Error messages:Failed to query the user who submits the job on MRS Manager. The error code is 0191.The current user does not exist on MRS Manager. Grant the user sufficie", + "product_code":"dataartsstudio", + "title":"What Should I Do If an Error Is Reported When I Submit an MRS Job with an Agency Through an MRS Cluster Connected Using an MRS API or the MRS Tenant Plane?", + "uri":"dataartsstudio_03_0630.html", + "doc_type":"usermanual", + "p_code":"402", + "code":"452" }, { "desc":"HUAWEI CLOUD Help Center presents technical documents to help you quickly get started with HUAWEI CLOUD services. The technical documents include Service Overview, Price Details, Purchase Guide, User Guide, API Reference, Best Practices, FAQs, and Videos.", @@ -3984,6 +4074,6 @@ "uri":"dataartsstudio_12_0010.html", "doc_type":"usermanual", "p_code":"", - "code":"443" + "code":"453" } ] \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0001.html b/docs/dataartsstudio/umn/dataartsstudio_01_0001.html index ed31a638b..bfc3f7bcf 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0001.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0001.html @@ -1,9 +1,9 @@

Accessing the DataArts Studio Instance Console

-

Prerequisites

A DataArts Studio instance has been obtained. For details, see Creating a DataArts Studio Basic Package.

+

Prerequisites

You have obtained a DataArts Studio instance. For details, see Creating a DataArts Studio Instance.

-

Procedure

  1. Log in to the cloud console. Choose DataArts Studio from the service list in the upper left corner to access the DataArts Studio instance console.

    • If there are multiple DataArts Studio instances in the current region, the instance list is displayed by default. Locate an instance and click Access to access the DataArts Studio console.

      +

      Procedure

      1. Log in to the cloud console. Choose DataArts Studio from the service list in the upper left corner.

        • If there are multiple DataArts Studio instances in the current region, the instance list is displayed by default. Locate an instance and click Access to access the DataArts Studio console homepage.

        • If there is only one DataArts Studio instance in the current region, the DataArts Studio console homepage is displayed by default.

          @@ -14,7 +14,7 @@
      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0003.html b/docs/dataartsstudio/umn/dataartsstudio_01_0003.html deleted file mode 100644 index 46f5709c3..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0003.html +++ /dev/null @@ -1,13 +0,0 @@ - - -

      Preparations

      -

      Before using DataArts Studio, you need to create a a cloud platform account, create a DataArts Studio instance, access the DataArts Studio instance console, manage workspaces, and authorize users to use DataArts Studio.

      -

      The following figure shows the preparations and operations, which will be described in detail in later sections.

      -
      Figure 1 Preparations for using DataArts Studio
      -
      -
      - -
      - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0004.html b/docs/dataartsstudio/umn/dataartsstudio_01_0004.html index a4dfc6290..b18be2262 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0004.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0004.html @@ -1,27 +1,29 @@ -

      Creating an IAM User and Assigning DataArts Studio Permissions

      -
      Identity and Access Management (IAM) can be used for fine-grained permissions management on your DataArts Studio resources. With IAM, you can:
      • Create IAM users for employees based on your enterprise's organizational structure. Each IAM user will have their own security credentials for accessing DataArts Studio resources.
      • Assign users only the permissions required to perform a task.
      • Entrust a a cloud platform account or cloud service to perform efficient O&M on your DataArts Studio resources.
      +

      Creating an IAM User and Assigning DataArts Studio Permissions

      +
      Identity and Access Management (IAM) can be used for fine-grained permissions management on your DataArts Studio resources. With IAM, you can:
      • Create IAM users for employees based on your enterprise's organizational structure. Each IAM user will have their own security credentials for accessing DataArts Studio resources.
      • Grant users only the permissions required to perform a given task based on their job responsibilities.
      • Entrust a cloud account or cloud service to perform efficient O&M on your DataArts Studio resources.
      -

      If you do not require individual IAM users for permissions management, skip this section.

      -

      Background

      • Before assigning permissions to a user group, you need to understand the DataArts Studio permission system and select permissions as needed.
      -
      -

      Notes and Constraints

      • The DARTS User role provides permissions related to instances, workspaces, and dependent services. Workspace roles provide service operation permissions in workspaces.
      • IAM provides the following two authorization mechanisms. DataArts Studio supports IAM roles but not IAM policies.
        • IAM roles: IAM initially provides a coarse-grained authorization mechanism to define permissions based on users' job responsibilities. Only a limited number of service-level roles are available for authorization. However, traditional IAM roles are not an ideal choice for fine-grained authorization and secure access control.
        • IAM policies: A type of fine-grained authorization mechanism that defines permissions required to perform operations on specific cloud resources under certain conditions. This type of authorization is more flexible and meets the principle of least privilege (PoLP).
        +

        If you do not require individual IAM users for permissions management, skip this topic.

        +

        This section describes the procedure for granting permissions. See Procedure for details.

        +

        Context

        • Before assigning permissions to a user group, you need to understand the permission system of so that you can select the permissions that meet your needs.
          Figure 1 Permission system
        -

        Procedure

        Figure 1 Authorization process
        -
        1. Create a user group and assign a system role to the group.

          Log in to the IAM console using a cloud platform account, create a user group and assign a DataArts Studio system role to the group. For example, the system role can be DARTS Administrator or DARTS User.

          -

          For details, see "User Groups and Authorization" > "Creating a User Group and Assigning Permissions" in Identity and Access Management User Guide.

          -
          • When configuring DataArts Studio permissions for a user group, enter DARTS in the search box to search for the permissions and select the permissions to be granted to the user group, for example, DARTS User.
          • DataArts Studio is a project-level service deployed in specific physical regions. If you select All resources for Scope, the permission takes effect in all projects of all regions. If you select Region-specific projects for Scope, the permission takes effect only for a specified project. When accessing DataArts Studio, the IAM user must switch to the region where they have been assigned the required permissions.
          +

          Notes and Constraints

          • The DARTS User system role provides the permissions related to instances, workspaces, and dependent services. The operation permissions in workspaces are provided by workspace roles.
          • IAM provides the following two authorization mechanisms: Note that DataArts Studio supports only the IAM role-based authorization and does not support the IAM policy-based authorization.
            • IAM Roles: IAM initially provides a coarse-grained authorization mechanism to define permissions based on users' job responsibilities. Only a limited number of service-level roles are available. However, traditional IAM roles are not an ideal choice for fine-grained authorization and secure access control.
            • IAM Policies: A type of fine-grained authorization mechanism that defines permissions required to perform operations on specific cloud resources under certain conditions. This type of authorization is more flexible and is ideal for least privilege access.
            +
            +
          +
          +

          Procedure

          1. Create a user group and assign a system role to the group.

            Log in to the IAM console using a cloud account, create a user group and assign a DataArts Studio system role to the group. For example, the system role can be DARTS Administrator or DARTS User.

            +

            For details, see "User Groups and Authorization" > "Creating a User Group and Assigning Permissions" in Identity and Access Management User Guide.

            +
            • When configuring DataArts Studio permissions for a user group, enter DARTS in the search box to search for the permissions and select the permissions to be granted to the user group, for example, DARTS User.
            • DataArts Studio is a project-level service deployed in specific physical regions. If you select All resources for Scope, the permission takes effect in all projects of all regions. If you select Region-specific projects for Scope, the permission takes effect only for a specified project. When accessing DataArts Studio, the IAM user must switch to the region where they have been assigned the required permissions.
            -

          2. Create a user and add it to the user group.

            Create users on the IAM console and add them to the group created in step 1.

            -

            For details, see "IAM Users" > "Creating an IAM User" in Identity and Access Management User Guide.

            -

            An IAM user can pass the authentication and access DataArts Studio through an API or SDK only if Programmatic access is selected for Access Type during the creation of the IAM user.

            +

          3. Create a user and add the user to the user group.

            Create users on the IAM console and add them to the group created in Step 1.

            +

            For details, see "IAM Users" > "Creating an IAM User" in Identity and Access Management User Guide.

            +

            An IAM user can pass the authentication and access DataArts Studio through an API or SDK only if Programmatic access is selected for Access Type during the creation of the IAM user.

            -

          4. Create a custom workspace role for DARTS User, add it as a workspace member, and assign a role to the member.

            DataArts Studio workspace roles determine the permissions of DARTS User in a workspace. There are five preset roles: admin, developer, deployer, operator, and viewer. If these preset roles can meet your requirements, you do not need to create a custom workspace role. Instead, you can add the user as a workspace member and assign a preset role to the member. Otherwise, you need to create a custom role, add the users as a workspace member, and assign the custom role to the member. For details about how to create a custom workspace role, see (Optional) Defining a Workspace Role. For details about how to add a workspace member and assign a role to the member, see Adding a Member and Assigning a Role.

            -

            For details about the permissions of the roles, see "DataArts Studio Permissions" in Service Overview.

            +

          5. Create a custom workspace role for DARTS User, add it as a workspace member, and assign a role to the member.

            DataArts Studio workspace roles determine the permissions of DARTS User in a workspace. There are five preset roles: admin, developer, deployer, operator, and viewer. If these preset roles can meet your requirements, you do not need to create a custom workspace role. Instead, you can add the user as a workspace member and assign a preset role to the member. Otherwise, you need to create a custom role, add the users as a workspace member, and assign a custom role to the member. For details about how to create a custom workspace role, see (Optional) Defining a Workspace RoleFor details about how to add a workspace member and assign a role, see Adding Workspace Members and Assigning Roles.

            +

            For details about the permissions of the roles, see "Permissions" in Service Overview.

          6. Log in to the console and verify permissions.

            Log in to the console using the created user and verify permissions of the user.

            -
            • Choose Service List > DataArts Studio. Locate a DataArts Studio instance and click Access. Check whether the workspace list is displayed.
            • Access a service module (for example, Management Center) to which your current user has been added and check whether you can perform the operations allowed for the workspace role assigned to you.
            +
            • Choose Service List > DataArts Studio. Locate a DataArts Studio instance and click Access. Check whether the workspace list is displayed.
            • Access a service module (for example, Management Center) to which your current user has been added and check whether you can perform the operations allowed for the workspace role assigned to you.

          @@ -31,3 +33,10 @@
        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0005.html b/docs/dataartsstudio/umn/dataartsstudio_01_0005.html new file mode 100644 index 000000000..9e5a3d81a --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0005.html @@ -0,0 +1,234 @@ + + +

        Data Sources Supported by DataArts Studio

        +

        Before using DataArts Studio, you need to select cloud services or databases as the data foundation, which provides storage and compute capabilities. DataArts Studio provides one-stop data development, governance, and services based on the data foundation.

        +

        Supported Data Sources

        This section describes the data sources supported by DataArts Studio modules other than DataArts Migration. Table 1 lists the data sources supported by each module.

        +

        Except DataArts Migration, all other modules use the data connections created in Management Center. (A data connection can be used in a module which was selected during the creation of the connection.) To connect to these data sources, go to the DataArts Studio console and choose Management Center to create data connections.

        +

        The data sources supported by the migration jobs in DataArts Migration are different from those supported by other modules, and are described in the DataArts Migration chapter.

        +
        + +
        + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
        Table 1 Data sources supported by DataArts Studio

        Data Source Type

        +

        Management Center

        +

        DataArts Factory

        +

        DWS

        +

        Supported

        +

        Supported

        +

        DLI

        +

        Supported

        +

        Supported

        +

        MRS HBase

        +

        Supported

        +

        Not supported

        +

        MRS Hive

        +

        Supported

        +

        Supported

        +

        MRS Kafka

        +

        Supported

        +

        Supported

        +

        MRS Spark

        +

        Supported

        +

        Supported

        +

        MRS ClickHouse

        +

        Supported

        +

        Supported

        +

        MRS Hetu

        +

        Supported

        +

        Supported

        +

        MRS Impala

        +

        Supported

        +

        Supported

        +

        MRS Doris

        +

        Supported

        +

        Supported

        +

        RDS for MySQL

        +

        Supported

        +

        Supported

        +

        RDS for PostgreSQL

        +

        Supported

        +

        Supported

        +

        RDS for SQL Server

        +

        Supported

        +

        Not supported

        +

        MySQL

        +

        Supported

        +

        Not supported

        +

        Oracle

        +

        Supported

        +

        Not supported

        +

        Host Connection

        +

        Supported

        +

        Supported

        +
        +
        +

        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

        +
        +
        +

        Overview

        +
        + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
        Table 2 Data source overview

        Data Source Type

        +

        Description

        +

        DWS

        +

        DWS employs the shared-nothing architecture and massively parallel processing (MPP) engine. It is compatible with ANSI SQL 99, SQL 2003, and the PostgreSQL or Oracle database ecosystem, providing competitive solutions for analyzing petabytes of data in various industries.

        +

        DLI

        +

        DLI is a serverless big data compute and analysis service that is fully compatible with Apache Spark and Apache Flink ecosystems. With multi-model engines supported by DLI, enterprises can use SQL statements or programs to easily complete batch processing, stream processing, in-memory computing, and machine learning of heterogeneous data sources.

        +

        MRS HBase

        +

        HBase undertakes data storage. It is an open-source, column-oriented, distributed storage system that is suitable for storing massive amounts of unstructured or semi-structured data. It features high reliability, high performance, and flexible scalability, and supports real-time data read/write.

        +

        MRS HBase stores massive amount of data and supports data queries in milliseconds. MRS HBase can load and update logistics data in milliseconds, and query and analyze petabytes of time series data in seconds.

        +

        MRS Hive

        +

        Hive is a mechanism that can store, query, and analyze large-scale data stored in Hadoop. Hive defines simple SQL-like query language, which is known as HiveQL. It allows a user familiar with SQL to query data.

        +

        MRS Hive can be used to analyze terabytes or petabytes of data and quickly migrate on-premises Hadoop big data platforms (such as CDH and HDP) to the cloud without service interruption and service code modification.

        +

        MRS Kafka

        +

        MRS provides dedicated MRS Kafka clusters. Kafka is an open-source, distributed, partitioned, and replicated commit log service. Kafka is publish-subscribe messaging, rethought as a distributed commit log. It provides features similar to Java Message Service (JMS) but another design. It features message endurance, high throughput, distributed methods, multi-client support, and real time. It applies to both online and offline message consumption, such as regular message collection, website activeness tracking, aggregation of statistical system operation data (monitoring data), and log collection. These scenarios engage large amounts of data collection for Internet services.

        +

        MRS Spark

        +

        Spark is an open-source parallel data processing framework. It helps users easily develop unified big data applications and perform cooperative processing, stream processing, and interactive analysis on data.

        +

        Spark provides a framework featuring fast calculation, write, and interactive query. Spark has obvious advantages over Hadoop in terms of performance. Spark provides the Spark SQL language similar to SQL statements to process structured data.

        +

        MRS ClickHouse

        +

        ClickHouse is an open-source columnar database oriented to online analysis and processing. It is independent of the Hadoop big data system and features ultimate compression rate and fast query performance. In addition, ClickHouse supports SQL query and provides good query performance, especially the aggregation analysis and query performance based on large and wide tables. The query speed is one order of magnitude faster than that of other analytical databases.

        +

        ClickHouse is widely used in various fields such as Internet advertising, apps, web, telecommunications, finance, and IoT. It suits business intelligence ideally.

        +

        MRS Impala

        +

        Impala provides fast, interactive SQL queries directly on your Apache Hadoop data stored in HDFS, HBase, or the Object Storage Service (OBS). In addition to using the same unified storage platform, Impala also uses the same metadata, SQL syntax (Hive SQL), ODBC driver, and user interface (Impala query UI in Hue) as Apache Hive. This provides a familiar and unified platform for real-time or batch-oriented queries. Impala is an addition to tools available for querying big data. Impala does not replace the batch processing frameworks built on MapReduce such as Hive. Hive and other frameworks built on MapReduce are best suited for long running batch jobs.

        +

        MRS Hudi

        +

        Hudi is a data lake table format that provides the ability to update and delete data as well as consume new data on HDFS. It supports multiple compute engines and provides insert, update, and delete (IUD) interfaces and streaming primitives, including upsert and incremental pull, over datasets on HDFS.

        +

        Hudi metadata is stored in Hive, and operations are performed using Spark.

        +

        MRS Doris

        +

        Doris is a high-performance, real-time analytical database. It can return query results of mass data in sub-seconds and can support high-concurrency point queries and high-throughput complex analysis. Apache Doris can meet requirements in report analysis, instant query, unified data warehouse building, and data lake federated query.

        +

        RDS

        +

        RDS is an online, out-of-the-box relational database service that is based on the cloud computing platform. It is stable, reliable, scalable, and easy to manage.

        +

        MySQL

        +

        MySQL is one of the most popular open-source databases. It features excellent performance, uses mature and stable architecture, supports popular applications, adapts to multiple fields and industries, and supports various web applications. It is cost-effective and preferred by small- and medium-sized enterprises.

        +

        Oracle

        +

        Oracle is a group of software that mainly applied to the distributed database. The Oracle database is one of the most popular Client/Server (C/S) and Browser/Server (B/S) databases.

        +

        It is also the most widely used database management system in the world. As a general database system, the Oracle database provides complete data management functions. As a relational database, it provides complete relational models. As a distributed database, it implements distributed data processing.

        +

        Rest Client

        +

        The Rest Client can be used to execute RESTful requests that are authenticated using IAM tokens or usernames and passwords.

        +

        Host Connection

        +

        You can connect to a specified host during data development and execute shell or Python scripts on the host through script development and job development. If the host connection information changes, you only need to edit it on the Host Connections page, but do not need to edit it in scripts or jobs one by one.

        +
        +
        +
        +
        +
        + +
        + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0005_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0005_0.html deleted file mode 100644 index 0cb6365cc..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0005_0.html +++ /dev/null @@ -1,228 +0,0 @@ - - -

        Data Sources

        -

        Before using DataArts Studio, you need to select cloud services or databases as the data lake foundation, which provides storage and compute capabilities. DataArts Studio provides one-stop data development, governance, and services based on the data lake foundation.

        -

        Data Sources Supported By DataArts Studio

        DataArts Studio can interconnect with cloud services such as DWS, DLI, and MRS Hive as well as traditional databases such as MySQL and . For details, see Table 1.

        -

        To connect to these data sources, go to the DataArts Studio console and choose Management Center to create a data connection.

        -

        The data connections in DataArts Studio Management Center are used to connect to the data lake foundation. DataArts Studio provides one-stop data development, governance, and services based on the data lake foundation.

        -
        - -
        - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
        Table 1 Data sources supported by DataArts Studio

        Data Source Type

        -

        Management Center

        -

        DataArts Factory

        -

        DWS

        -

        Supported

        -

        Supported

        -

        DLI

        -

        Supported

        -

        Supported

        -

        MRS HBase

        -

        Supported

        -

        Not supported

        -

        MRS Hive

        -

        Supported

        -

        Supported

        -

        MRS Kafka

        -

        Supported

        -

        Supported

        -

        MRS Spark

        -

        Supported

        -

        Supported

        -

        MRS ClickHouse

        -

        Supported

        -

        Supported

        -

        MRS Hetu

        -

        Supported

        -

        Supported

        -

        MRS Impala

        -

        Supported

        -

        Supported

        -

        MRS Doris

        -

        Supported

        -

        Supported

        -

        RDS for MySQL

        -

        Supported

        -

        Supported

        -

        RDS for PostgreSQL

        -

        Supported

        -

        Supported

        -

        MySQL

        -

        Supported

        -

        Not supported

        -

        Oracle

        -

        Supported

        -

        Not supported

        -

        Host Connection

        -

        Supported

        -

        Supported

        -
        -
        -

        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

        -
        -
        -

        Overview

        -
        - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
        Table 2 Data source overview

        Data Source Type

        -

        Description

        -

        DWS

        -

        DWS employs the shared-nothing architecture and massively parallel processing (MPP) engine. It is compatible with ANSI SQL 99, SQL 2003, and the PostgreSQL or Oracle database ecosystem, providing competitive solutions for analyzing petabytes of data in various industries.

        -

        DLI

        -

        DLI is a serverless big data compute and analysis service that is fully compatible with Apache Spark and Apache Flink ecosystems. With multi-model engines supported by DLI, enterprises can use SQL statements or programs to easily complete batch processing, stream processing, in-memory computing, and machine learning of heterogeneous data sources.

        -

        MRS HBase

        -

        HBase undertakes data storage. It is an open-source, column-oriented, distributed storage system that is suitable for storing massive amounts of unstructured or semi-structured data. It features high reliability, high performance, and flexible scalability, and supports real-time data read/write.

        -

        MRS HBase stores massive amount of data and supports data queries in milliseconds. MRS HBase can load and update logistics data in milliseconds, and query and analyze petabytes of time series data in seconds.

        -

        MRS Hive

        -

        Hive is a mechanism that can store, query, and analyze large-scale data stored in Hadoop. Hive defines simple SQL-like query language, which is known as HiveQL. It allows users familiar with SQL to query data.

        -

        MRS Hive can be used to analyze terabytes or petabytes of data and quickly migrate on-premises Hadoop big data platforms (such as CDH and HDP) to the cloud without service interruption and service code modification.

        -

        MRS Kafka

        -

        MRS provides dedicated MRS Kafka clusters. Kafka is an open-source, distributed, partitioned, and replicated commit log service. Kafka is publish-subscribe messaging, rethought as a distributed commit log. It provides features similar to Java Message Service (JMS) but another design. It features message endurance, high throughput, distributed methods, multi-client support, and real time. It applies to both online and offline message consumption, such as regular message collection, website activeness tracking, aggregation of statistical system operation data (monitoring data), and log collection. These scenarios engage large amounts of data collection for Internet services.

        -

        MRS Spark

        -

        Spark is an open-source parallel data processing framework. It helps users easily develop unified big data applications and perform cooperative processing, stream processing, and interactive analysis on data.

        -

        Spark provides a framework featuring fast calculation, write, and interactive query. Spark has obvious advantages over Hadoop in terms of performance. Spark provides the Spark SQL language similar to SQL statements to process structured data.

        -

        MRS ClickHouse

        -

        ClickHouse is an open-source columnar database oriented to online analysis and processing. It is independent of the Hadoop big data system and features ultimate compression rate and fast query performance. In addition, ClickHouse supports SQL query and provides good query performance, especially the aggregation analysis and query performance based on large and wide tables. The query speed is one order of magnitude faster than that of other analytical databases.

        -

        ClickHouse is widely used in various fields such as Internet advertising, apps, web, telecommunications, finance, and IoT. It suits business intelligence ideally.

        -

        MRS Impala

        -

        Impala provides fast, interactive SQL queries directly on your Apache Hadoop data stored in HDFS, HBase, or the Object Storage Service (OBS). In addition to using the same unified storage platform, Impala also uses the same metadata, SQL syntax (Hive SQL), ODBC driver, and user interface (Impala query UI in Hue) as Apache Hive. This provides a familiar and unified platform for real-time or batch-oriented queries. Impala is an addition to tools available for querying big data. Impala does not replace the batch processing frameworks built on MapReduce such as Hive. Hive and other frameworks built on MapReduce are best suited for long running batch jobs.

        -

        MRS Hudi

        -

        Hudi is a data lake table format that provides the ability to update and delete data as well as consume new data on HDFS. It supports multiple compute engines and provides insert, update, and delete (IUD) interfaces and streaming primitives, including upsert and incremental pull, over datasets on HDFS.

        -

        Hudi metadata is stored in Hive, and operations are performed using Spark.

        -

        MRS Doris

        -

        Doris is a high-performance, real-time analytical database. It can return query results of mass data in sub-seconds and can support high-concurrency point queries and high-throughput complex analysis. Apache Doris can meet requirements in report analysis, instant query, unified data warehouse building, and data lake federated query.

        -

        RDS

        -

        RDS is an online, out-of-the-box relational database service that is based on the cloud computing platform. It is stable, reliable, scalable, and easy to manage.

        -

        Currently, DataArts Studio supports only MySQL and PostgreSQL databases in RDS.

        -

        MySQL

        -

        MySQL is one of the most popular open-source databases. It features excellent performance, uses mature and stable architecture, supports popular applications, adapts to multiple fields and industries, and supports various web applications. It is cost-effective and preferred by small- and medium-sized enterprises.

        -

        Oracle

        -

        Oracle is a group of software that mainly applied to the distributed database. The Oracle database is one of the most popular Client/Server (C/S) and Browser/Server (B/S) databases.

        -

        It is also the most widely used database management system in the world. As a general database system, the Oracle database provides complete data management functions. As a relational database, it provides complete relational models. As a distributed database, it implements distributed data processing.

        -

        Rest Client

        -

        The Rest Client can be used to execute RESTful requests that are authenticated using IAM tokens or usernames and passwords.

        -

        Host Connection

        -

        You can connect to a specified host during data development and execute shell or Python scripts on the host through script development and job development. If the host connection information changes, you only need to edit it on the Host Connections page, but do not need to edit it in scripts or jobs one by one.

        -
        -
        -
        -
        -
        - -
        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0006.html b/docs/dataartsstudio/umn/dataartsstudio_01_0006.html deleted file mode 100644 index 254b2d28a..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0006.html +++ /dev/null @@ -1,28 +0,0 @@ - - -

        (Optional) Obtaining Authentication Information

        -

        When using DataArts Studio, for example, when creating OBS links, calling APIs, or locating issues, you may need to obtain information such as access keys, project IDs, and endpoints. This section describes how to obtain such information.

        -

        Obtaining an Access Key

        To obtain an access key, perform the following steps:
        1. Log in to the TICS console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
        2. On the My Credentials page, choose Access Keys > Create Access Key. See Figure 1.
          Figure 1 Clicking Create Access Key
          -
        3. Click OK and save the access key file when prompted. The access key file is saved to the default download location in your browser. Open the credentials.csv file to view the access key with an AK and SK.
          • Only two access keys can be added for each user.
          • For security purposes, access keys are automatically downloaded only when they are generated for the first time and cannot be obtained from the console later. Keep them properly.
          -
          -
        -
        -
        -

        Obtaining a Project ID and Account ID

        A project is a group of tenant resources, and an account ID corresponds to the current account. The IAM ID corresponds to the current user. You can view the project IDs, account IDs, and user IDs in different regions on the corresponding pages.
        1. Register with and log in to the management console.
        2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
        3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project ID from the project list.
        -
        -
        -

        Obtaining the DataArts Studio Instance ID and Workspace ID

        You can obtain them from the URI on the DataArts Studio console.
        1. On the homepage of the DataArts Studio console, select a workspace, and click a module, for example, Management Center.
        2. On the Management Center page, obtain the values of instanceId and workspace in the browser address bar, which are the DataArts Studio instance ID and workspace ID, respectively.
          As shown in Figure 2, the instance ID is 6b88…2688, and the workspace ID is 1dd3bc…d93f0.
          Figure 2 Obtaining the instance ID and workspace ID
          -
          -
        -
        -
        -

        Obtaining an Endpoint

        An endpoint is the request address for calling an API. Endpoints vary depending on services and regions.

        -

        You can obtain endpoints from Regions and Endpoints.

        -
        -
        -
        - -
        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0008.html b/docs/dataartsstudio/umn/dataartsstudio_01_0008.html index a6c849a98..087e8b31f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0008.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0008.html @@ -5,15 +5,17 @@
      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0009.html b/docs/dataartsstudio/umn/dataartsstudio_01_0009.html index 110647302..2b1187594 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0009.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0009.html @@ -1,36 +1,42 @@ -

      Managing Data Connections

      +

      Configuring DataArts Studio Data Connection Parameters

      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0010.html b/docs/dataartsstudio/umn/dataartsstudio_01_0010.html index 73d7980f2..d4e0b1611 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0010.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0010.html @@ -1,32 +1,31 @@ -

      Migrating Resources

      +

      Configuring DataArts Studio Resource Migration

      To migrate resources in one workspace to another, you can use the resource migration function provided by DataArts Studio.

      -

      Resources that can be migrated include the data connections in Management Center.

      -

      Prerequisites

      • Resources can be imported from OBS or a local path.
      • There are resources that can be migrated. For details on how to create data connections, see Managing Data Connections.
      +
      Resources can be imported from OBS or a local path. Resources that can be migrated include the following service data:
      • Data connections created in Management Center
      • CDM jobs created in DataArts Migration, including the links in jobs
      • Scripts and jobs that have been submitted in DataArts Factory. By default, when jobs are exported, their dependent scripts and resources are not exported.
      -

      Constraints

      • Only an exported .zip file can be imported. During the import, the system verifies the resources in the file.
      • For security concerns, passwords of connections are not exported when the connections are exported. You need to enter the passwords when importing the connections.
      • The size of the file to be imported from an OBS bucket or local path cannot exceed 10 MB.
      +

      Constraints

      • Only an exported .zip file can be imported. During the import, the system verifies the resources in the file.
      • For security concerns, passwords of connections are not exported when the connections are exported. You need to enter the passwords when importing the connections.
      • The file to be imported from an OBS bucket or local path cannot be larger than 10 MB.
      -

      Exporting a Resource

      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
      2. On the DataArts Studio console, locate a workspace and click Management Center.
      3. In the navigation pane, choose Migrate Resources.

        Figure 1 Migrating Resources
        +

        Exporting a Resource

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
        2. On the DataArts Studio console, locate a workspace and click Management Center.
        3. In the navigation pane, choose Migrate Resources.

          Figure 1 Migrating Resources

          -

        4. Click Create Export Task to configure the file name and the OBS path for saving the file. If OBS is unavailable, you only need to set the file name.

          Figure 2 Export Task
          +

        5. Click Export Task to configure the file name and the OBS path for saving the file. If OBS is unavailable, you only need to set the file name.

          Figure 2 Export Task

        6. Click Next and select the resources to export.

          -

        7. Click Next and wait until the export is complete. The resource package is exported to the OBS path you have set.

          Figure 3 Export completed
          +

        8. Click Next and wait until the export is complete. The resource package is exported to the OBS path you have set.

          Figure 3 Export completed

          If no result is displayed in 1 minute, the export fails. Try again. If the failure persists, contact the customer service or technical support.

          -

        9. After the export is complete, you can click Download in the row of the corresponding migration task to download the exported resource package.

          Figure 4 Downloading the exported result
          +

        10. After the export is complete, you can click Download in the row of the corresponding migration task to download the exported resource package.

          Figure 4 Downloading the exported result

        -

        Importing a Resource

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
        2. On the DataArts Studio console, locate a workspace and click Management Center.
        3. In the navigation pane, choose Migrate Resources.

          Figure 5 Migrating Resources
          +

          Importing a Resource

          1. In the navigation pane, choose Migrate Resources.

            Figure 5 Migrating Resources

            -

          2. Click Create Import Task. On the displayed page, select an import mode and set the OBS bucket and path or local path that stores resources. The resource to be imported must be a .zip file exported from the console.

            Figure 6 Configuring the path that stores the resources to be imported
            +

          3. Click Import File. On the displayed page, select an import mode and set the OBS bucket and path or local path that stores resources. The resource to be imported must be a .zip file exported from the console.

            Figure 6 Configuring the path that stores the resources to be imported

            -

          4. Click Create Import Task and upload a .zip resource file that you have exported.
          5. Click Next and select the resources to import.

            -

          6. If you select DataSource, click Next to configure a data connection.

            Figure 7 Configuring a data connection
            -

          7. Click Next and wait until the import task is delivered. When the import task is delivered successfully, the system displays message "Import task started."

            Figure 8 Import task started
            +

          8. Click Import File and upload resources. a .zip resource file that you have exported.
          9. Click Next and select the resources to import.

            +

          10. If you select DataSource, click Next to configure a data connection.

            Figure 7 Configuring a data connection
            +

          11. Click Next and wait until the import task is delivered. When the import task is delivered successfully, the system displays message "Import task started."

            Figure 8 Import task started

            -

          12. Click OK. You can view the import result in the resource migration task list.

            Subtasks that fail are marked in red. You can click their names to view the failure causes.
            Figure 9 Viewing the import result
            +

          13. Click OK. You can view the import result in the resource migration task list.

            Subtasks that fail are marked in red. You can click their names to view the failure causes.
            Figure 9 Viewing the import result

          @@ -38,3 +37,10 @@
        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0012.html b/docs/dataartsstudio/umn/dataartsstudio_01_0012.html index 559117984..5d4927075 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0012.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0012.html @@ -1,20 +1,22 @@ -

        DataArts Migration

        +

        DataArts Migration (CDM Jobs)

      Data Sources Supported by Table/File Migration

      Table/File migration can migrate data in tables or files.

      Table 1 describes the supported data sources. -
      Table 1 Supported data sources during table/file migration

      Category

      +
      - - - - - - - - - - - - @@ -100,23 +101,23 @@ - - - - - - - - - - - - - - - - - - - - - - - - -
      Table 1 Supported data sources during table/file migration

      Category

      Source

      +

      Source

      Destination

      +

      Destination

      Description

      +

      Description

      Data warehouse

      +

      Data warehouse

      Data Warehouse Service

      +

      Data Warehouse Service

      • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), and MRS ClickHouse
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      +
      • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), and MRS ClickHouse
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)

      The DWS physical machine management mode is not supported.

      +

      The DWS physical machine management mode is not supported.

      Data Lake Insight (DLI)

      @@ -31,27 +31,28 @@
      • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), and MRS ClickHouse
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
      • NoSQL: CloudTable and MongoDB
      • Search: Elasticsearch and Cloud Search Service (CSS)

      Recommended MongoDB version: 4.2

      +

      You must have the SELECT permission (for querying tables) on all fields of the DLI data source.

      MRS ClickHouse

      Data warehouse: MRS ClickHouse and Data Lake Insight (DLI)

      • Recommended MRS ClickHouse version: 21.3.4.X
      • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

        +
      • Recommended MRS ClickHouse version: 21.3.4.X
      • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      Hadoop

      +

      Hadoop

      MRS HDFS

      +

      MRS HDFS

      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      +
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      • Supported by local storage. Only MRS Hive and MRS Hudi are supported in storage-compute decoupling scenarios.
      • Only MRS Hive is supported in Ranger scenarios.
      • Not supported if SSL is enabled for ZooKeeper
      • Recommended MRS HDFS versions:
        • 2.8.X
        • 3.1.X
        +
      • Supported by local storage. Only MRS Hive and MRS Hudi are supported in storage-compute decoupling scenarios.
      • Only MRS Hive is supported in Ranger scenarios.
      • Not supported if SSL is enabled for ZooKeeper
      • Recommended MRS HDFS versions:
        • 2.8.X
        • 3.1.X
      • Recommended MRS HBase versions:
        • 2.1.X
        • 1.3.X
      • MRS Hive and MRS Hudi 2.x versions are not supported. The following versions are recommended:
        • 1.2.X
        • 3.1.X
        -
      • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

        +
      • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      Apache HDFS

      Object storage

      +

      Object storage

      Object Storage Service (OBS)

      +

      Object Storage Service (OBS)

      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      +
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      • Object Storage Migration Service (OMS) is recommended for migration between object storage services.
      • Binary files cannot be imported to a database or NoSQL.
      +
      • Object Storage Migration Service (OMS) is recommended for migration between object storage services.
      • Binary files cannot be imported to a database or NoSQL.

      File system

      +

      File system

      FTP

      +

      FTP

      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      • Object-based storage: Object Storage Service (OBS)
      +
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      • Object-based storage: Object Storage Service (OBS)
      • The file system cannot serve as the destination.
      • Only text files such as CSV files can be migrated from FTP or SFTP servers to search services. Binary files cannot.
      • Only binary files can be migrated from FTP or SFTP servers to OBS.
      • obsutil is recommended for migrating data from HTTP servers to OBS.
      +
      • The file system cannot serve as the destination.
      • Only text files such as CSV files can be migrated from FTP or SFTP servers to search services. Binary files cannot.
      • Only binary files can be migrated from FTP or SFTP servers to OBS.
      • obsutil is recommended for migrating data from HTTP servers to OBS.

      SFTP

      @@ -127,13 +128,13 @@

      Hadoop: MRS HDFS

      Relational database

      +

      Relational database

      RDS for MySQL

      +

      RDS for MySQL

      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
      • Object-based storage: Object Storage Service (OBS)
      • NoSQL: CloudTable
      • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
      • Search: Elasticsearch and Cloud Search Service (CSS)
      +
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
      • Object-based storage: Object Storage Service (OBS)
      • NoSQL: CloudTable
      • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
      • Search: Elasticsearch and Cloud Search Service (CSS)
      • You are advised to use Data Replication Service (DRS) to migrate data between OLTP databases.
      • Recommended Microsoft SQL Server version: 2005 or later
      +
      • Recommended Microsoft SQL Server version: 2005 or later

      RDS for SQL Server

      @@ -184,13 +185,13 @@

      -

      NoSQL

      +

      NoSQL

      Distributed Cache Service (DCS)

      +

      Distributed Cache Service (DCS)

      Hadoop: MRS HDFS, MRS HBase, and MRS Hive

      +

      Hadoop: MRS HDFS, MRS HBase, and MRS Hive

      NoSQL except CloudTable cannot serve as the destination.

      +

      NoSQL except CloudTable cannot serve as the destination.

      Redis

      @@ -212,15 +213,15 @@
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)

      Message system

      +

      Message system

      Apache Kafka

      +

      Apache Kafka

      Search: Cloud Search Service (CSS)

      +

      Search: Cloud Search Service (CSS)

      The message system cannot serve as the destination.

      +

      The message system cannot serve as the destination.

      DMS Kafka

      @@ -230,18 +231,18 @@
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      • MRS Kafka cannot serve as the destination.
      • Supported only by local storage and not in storage-compute decoupling scenarios.
      • Not supported by Ranger.
      • Not supported if SSL is enabled for ZooKeeper.
      • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

        +
      • MRS Kafka cannot serve as the destination.
      • Supported only by local storage and not in storage-compute decoupling scenarios
      • Not supported by Ranger
      • Not supported if SSL is enabled for ZooKeeper
      • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      Search

      +

      Search

      Elasticsearch

      +

      Elasticsearch

      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)
      +
      • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
      • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
      • Object-based storage: Object Storage Service (OBS)
      • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
      • NoSQL: CloudTable
      • Search: Elasticsearch and Cloud Search Service (CSS)

      Only the non-security mode is supported.

      +

      Only the non-security mode is supported.

      Cloud Search Service (CSS)

      @@ -294,7 +295,7 @@

      Entire DB migration only to MRS HBase

      Recommended versions:
      • 2.1.X
      • 1.3.X
      -

      MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      +

      MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      MRS Hive

      @@ -306,7 +307,7 @@

      Entire DB migration only to a relational database

      2.x versions are not supported. The following versions are recommended:
      • 1.2.X
      • 3.1.X
      -

      MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      +

      MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      FusionInsight HBase

      @@ -358,9 +359,9 @@

      Supported

      Supported only by local storage and in storage-compute decoupling scenarios

      -

      2.x versions are not supported. The following versions are recommended:

      +

      2.x versions are not supported. The following versions are recommended:

      • 1.2.X
      • 3.1.X
      -

      MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      +

      MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

      Relational database

      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0015.html b/docs/dataartsstudio/umn/dataartsstudio_01_0015.html index 7786c8cc8..7c46faf87 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0015.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0015.html @@ -1,11 +1,11 @@ -

      Constraints

      -

      CDM System Constraints

      1. You cannot modify the flavor of an existing cluster. If you require a higher flavor, create a cluster with your desired flavor.
      2. Arm CDM clusters do not support agents. The CDM cluster version (Arm or x86) is determined by the architecture of underlying resources.
      3. CDM does not support the function of controlling the data migration speed. Therefore, do not perform data migration during peak hours.
      4. During data migration, CDM imposes pressure on the data source. You are advised to create a database account for data migration and configure an account policy to reduce the resource consumption of the data source. For example, you can configure a policy to delete the connections of the account when the CPU usage exceeds 30% to prevent impact on services.
      5. The baseline and maximum bandwidths of the NIC of the cdm.large CDM instance is 0.8 Gbit/s and 3 Gbit/s, respectively. The theoretical maximum volume of data that can be transmitted per instance per day is about 8 TB. Similarly, the baseline and maximum bandwidths of the NIC of the cdm.xlarge instance are 4 Gbit/s and 10 Gbit/s, respectively, and the theoretical maximum volume of data that can be transmitted per instance per day is about 40 TB. The baseline and maximum bandwidths of the NIC of the cdm.4xlarge instance is 36 Gbit/s and 40 Gbit/s, respectively, and the theoretical maximum volume of data that can be transmitted per instance per day is about 360 TB. You can use multiple CDM instances if you want faster data transfer.

        The actual amount of data that can be migrated in a day depends on the data source type, the read and write performance of the source and destination, and the actual available bandwidth. Typically you can migrate as much as 8 TB per day (large file migration to OBS) using the cdm.large instance. It is recommended that you test the speed with a small amount of data before migration.

        +

        Notes and Constraints

        +

        CDM System Notes and Constraints

        1. You cannot modify the flavor of an existing cluster. If you require a higher flavor, create a cluster with your desired flavor.
        2. The CDM cluster version (Arm or x86) is determined by the architecture of underlying resources.
        3. CDM does not support the function of controlling the data migration speed. Therefore, do not perform data migration during peak hours.
        4. During data migration, CDM imposes pressure on the data source. You are advised to create a database account for data migration and configure an account policy to reduce the resource consumption of the data source. For example, you can configure a policy to delete the connections of the account when the CPU usage exceeds 30% to prevent impact on services.
        5. The baseline and maximum bandwidths of the NIC of the cdm.large CDM instance is 0.8 Gbit/s and 3 Gbit/s, respectively. The theoretical maximum volume of data that can be transmitted per instance per day is about 8 TB. Similarly, the baseline and maximum bandwidths of the NIC of the cdm.xlarge instance are 4 Gbit/s and 10 Gbit/s, respectively, and the theoretical maximum volume of data that can be transmitted per instance per day is about 40 TB. The baseline and maximum bandwidths of the NIC of the cdm.4xlarge instance is 36 Gbit/s and 40 Gbit/s, respectively, and the theoretical maximum volume of data that can be transmitted per instance per day is about 360 TB. You can use multiple CDM instances if you want faster data transfer.

          The actual amount of data that can be migrated in a day depends on the data source type, the read and write performance of the source and destination, and the actual available bandwidth. Typically you can migrate as much as 8 TB per day (large file migration to OBS) using the cdm.large instance. It is recommended that you test the speed with a small amount of data before migration.

        6. CDM supports incremental file migration (by skipping repeated files), but does not support resumable transfer.

          For example, if three files are to be migrated and the second file fails to be migrated due to the network fault. When the migration task is started again, the first file is skipped. The second file, however, cannot be migrated from the point where the fault occurs, but can only be migrated again.

        7. During file migration, a single task supports millions of files. If there are too many files in the directory to be migrated, you are advised to split the files into different directories and create multiple tasks.
        8. You can export links and jobs configured on CDM to a local directory. To ensure password security, CDM does not export the link password of the corresponding data source. Therefore, before importing job configurations to CDM, you need to manually input the password in the exported JSON file or configure the password in the import dialog box.
        9. The cluster cannot automatically upgrade to a new version. You need to use the job export and import functions to upgrade the cluster to the new version.
        10. If OBS is unavailable, CDM does not automatically back up users' job configurations. You need to export and back up configuration data using the export function.
        11. If VPC peering connection is configured, the peer VPC subnet may overlap with the CDM management network. As a result, data sources in the peer VPC cannot be accessed. You are advised to use the public network for cross-VPC data migration, or contact the administrator to add specific routes to the VPC peering connection in the CDM background.
        12. If the destination of a CDM job is a DWS or NewSQL database, constraints of the source end, such as the primary key and unique index, cannot be migrated together.
        13. When performing a CDM job, ensure that the JSON file formats of the two clusters are the same so that jobs can be imported from the source cluster to the destination cluster.
        14. If a running job is interrupted unexpectedly, the data that has been written to the destination will not be deleted. You must manually delete the data if needed.
        15. The size of a file to be transferred cannot exceed 1 TB.
        -

        General Constraints on Database Migration

        1. CDM is mainly used for batch migration. It supports only limited incremental migration but does not support real-time incremental migration.
        2. The entire DB migration of CDM supports only data table migration but not migration of database objects such as stored procedures, triggers, functions, and views.

          CDM applies only to scenarios where databases are migrated to the cloud at a time, including homogeneous and heterogeneous database migrations. CDM is not applicable to data synchronization, for example, disaster recovery and real-time synchronization.

          +

          General Notes and Constraints on Database Migration

          1. CDM is mainly used for batch migration. It supports only limited incremental migration but does not support real-time incremental migration.
          2. The entire DB migration of CDM supports only data table migration but not migration of database objects such as stored procedures, triggers, functions, and views.

            CDM applies only to scenarios where databases are migrated to the cloud at a time, including homogeneous and heterogeneous database migrations. CDM is not applicable to data synchronization, for example, disaster recovery and real-time synchronization.

          3. If CDM fails to migrate an entire database or table, the data that has been imported to the target table will not be rolled back automatically. If you want to perform migration in transaction mode, configure the Import to Staging Table parameter to enable a rollback upon a migration failure.

            In extreme cases, the created stage table or temporary table cannot be automatically deleted. You need to manually clear the table (the name of the stage table ends with _cdm_stage), for example, cdmtet_cdm_stage).

          4. If CDM needs to access data sources in the on-premises data center (for example, the on-premises MySQL database), the data sources must support Internet access and the CDM instances must be bound with elastic IP addresses. In this case, the security practice is to configure the firewall or security policies to allow only the EIPs of the CDM instances to access the local data sources.
          5. Only common data types are supported, including character strings, digits, and dates. Object types are limited. If objects are too large, migration cannot be performed.
          6. Only the GBK and UTF-8 character sets are supported.
          7. A field name cannot contain & or %.
          8. jdbc2hive and hive2jdbc entire DB migration is implemented by field name mapping, and is unavailable if the source and destination field names are inconsistent.
          @@ -14,7 +14,7 @@

        Constraints on FusionInsight HD and Apache Hadoop

        If the FusionInsight HD and Apache Hadoop data sources are deployed in the on-premises data center, CDM must access all nodes in the cluster for reading and writing the Hadoop files. Therefore, the network access must be enabled for each node.

        -

        Constraints on DWS and FusionInsight LibrA

        1. If the DWS primary key or table contains only one field, the field type must be a common character string, value, or date. When data is migrated from another database to DWS, if automatic table creation is selected, the primary key must be of the following types. If no primary key is set, at least one of the following fields must be set. Otherwise, the table cannot be created and the CDM job fails.
          • INTEGER TYPES: TINYINT, SMALLINT, INT, BIGINT, NUMERIC/DECIMAL
          • CHARACTER TYPES: CHAR, BPCHAR, VARCHAR, VARCHAR2, NVARCHAR2, TEXT
          • DATA/TIME TYPES: DATE, TIME, TIMETZ, TIMESTAMP, TIMESTAMPTZ, INTERVAL, SMALLDATETIME
          +

          Constraints on GaussDB(DWS)

          1. If the DWS primary key or table contains only one field, the field type must be a common character string, value, or date. When data is migrated from another database to DWS, if automatic table creation is selected, the primary key must be of the following types. If no primary key is set, at least one of the following fields must be set. Otherwise, the table cannot be created and the CDM job fails.
            • INTEGER TYPES: TINYINT, SMALLINT, INT, BIGINT, NUMERIC/DECIMAL
            • CHARACTER TYPES: CHAR, BPCHAR, VARCHAR, VARCHAR2, NVARCHAR2, TEXT
            • DATA/TIME TYPES: DATE, TIME, TIMETZ, TIMESTAMP, TIMESTAMPTZ, INTERVAL, SMALLDATETIME

            For clusters of version 2.9.1.200 or earlier, the NVARCHAR2 data type is not supported for DWS.

          2. In DWS, the character string '' is null. A null character string cannot be inserted into a field with non-null constraints. This is inconsistent with the MySQL behavior. MySQL does not consider that '' is null. Migration from MySQL to DWS may fail due to the preceding reason.
          3. When the Gauss Data Service (GDS) mode is used to quickly import data to DWS, you need to configure a security group or firewall policy to allow DataNodes of DWS or FusionInsight LibrA to access port 25000 of the CDM IP address.
          4. When data is imported to DWS in GDS mode, CDM automatically creates a foreign table for data import. The table name ends with a universally unique identifier (UUID), for example, cdmtest_aecf3f8n0z73dsl72d0d1dk4lcir8cd. If a job fails, it will be automatically deleted. In extreme cases, you may need to manually delete it.
          @@ -70,7 +70,7 @@ STORED AS TEXTFILE;
          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0017.html b/docs/dataartsstudio/umn/dataartsstudio_01_0017.html index c417f5c24..609b584e0 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0017.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0017.html @@ -1,27 +1,27 @@ -

          Managing Clusters

          +

          Creating and Managing a CDM Cluster

          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0018.html b/docs/dataartsstudio/umn/dataartsstudio_01_0018.html index 9134d7a01..06550090d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0018.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0018.html @@ -15,7 +15,7 @@
        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0020_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0020_0.html deleted file mode 100644 index fb8e763d9..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0020_0.html +++ /dev/null @@ -1,20 +0,0 @@ - - -

        Binding or Unbinding an EIP

        -

        Scenario

        After creating a CDM cluster, you can bind an EIP to or unbind an EIP from the cluster.

        -

        If CDM needs to access a local or Internet data source, or a cloud service in another VPC, bind an EIP to the CDM cluster or use a NAT gateway to enable the CDM cluster to share the EIP with ECSs to access the Internet.

        -

        If SSL encryption is configured for the access channel of a local data source, CDM cannot connect to the data source using the EIP.

        -
        -
        -

        Prerequisites

        • You have created a CDM cluster.
        • Your EIP quota is sufficient.
        -
        -

        Procedure

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
        2. Bind an EIP to or unbind an EIP from a cluster.

          • Binding an EIP: In the Operation column, click Bind EIP. The Bind EIP dialog box is displayed.
          • Unbinding an EIP: In the Operation column, choose More > Unbind EIP.
          -

        3. Click Yes.
        -
        -
        -
        - -
        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0021_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0021_0.html deleted file mode 100644 index 140f1422b..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0021_0.html +++ /dev/null @@ -1,27 +0,0 @@ - - -

        Viewing Basic Cluster Information and Modifying Cluster Configurations

        -

        Scenario

        After creating a CDM cluster, you can view its basic information and modify its configurations.

        -
        • You can view the following basic cluster information:
          • Cluster information: cluster version, creation time, project ID, instance ID, and cluster ID
          • Instance configuration: cluster flavor, CPU, and memory
          • Network configuration
          -
        • You can modify the following cluster configurations:
          • Notification: If a CDM migration job (only table/file migration) fails or the EIP is abnormal, CDM sends an SMS or email notification to the user.
          • User isolation: determines whether other users can operate the migration jobs or links in the cluster.
            • If this function is enabled, migration jobs and links in the cluster are isolated. Other IAM users of the a cloud platform account cannot operate the jobs and links.
            • If this function is disabled, migration jobs and links in the cluster can be shared by users. All IAM users with the required permission in the a cloud platform account can view and perform operations on the jobs and links in the cluster.

              After disabling User Isolation, restart the cluster VM for the settings to take effect.

              -
            -
          -
        -
        -

        Prerequisites

        You have created a CDM cluster.

        -
        -

        Viewing Basic Cluster Information

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
        2. Click the cluster name to view its basic information.

          -

        -
        -

        Modifying Cluster Configurations

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
        1. Click the name of a cluster and click the Cluster Configuration tab to modify Notification and User Isolation configuration.

          -

        2. Click Save. The Cluster Management page is displayed.
        3. If User Isolation is disabled, choose More > Restart in the Operation column to restart the cluster VM for the settings to take effect.

          Figure 1 Restarting a cluster
          -
          • Restart CDM service process: Only the CDM service process is restarted. The cluster VM will not be restarted.
          • VM restart: The service process will be interrupted and VMs in the cluster will be restarted.
          -

        4. Select VM restart and click Yes.
        -
        -
        -
        - -
        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0022.html b/docs/dataartsstudio/umn/dataartsstudio_01_0022.html index 1b1994e1e..63e972e77 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0022.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0022.html @@ -1,17 +1,24 @@ -

        Downloading Cluster Logs

        +

        Downloading CDM Cluster Logs

        Scenario

        This section describes how to obtain cluster logs to view the job running history and locate job failure causes.

        Prerequisites

        You have created a CDM cluster.

        -

        Procedure

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
        1. Locate the row that contains a cluster, click More in the Operation column, and select Download Log from the drop-down list.

          Figure 1 Download Log
          +

          Procedure

          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
          1. Locate the row that contains a cluster, click More in the Operation column, and select Download Log from the drop-down list.

            Figure 1 Download Log

          2. In the displayed dialog box, click OK to download logs to a local PC.
        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0023.html b/docs/dataartsstudio/umn/dataartsstudio_01_0023.html index d6852a722..2f21e2cd2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0023.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0023.html @@ -1,73 +1,21 @@ -

        Managing Links

        +

        Creating a Link in a CDM Cluster

        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0024.html b/docs/dataartsstudio/umn/dataartsstudio_01_0024.html index 0e3fca6b7..39e585336 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0024.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0024.html @@ -1,17 +1,17 @@ -

        Creating Links

        +

        Creating a Link Between CDM and a Data Source

        Scenario

        Before creating a data migration job, create a link to enable the CDM cluster to read data from and write data to a data source. A migration job requires a source link and a destination link. For details on the data sources that can be exported (source links) and imported (destination links) in different migration modes (table/file migration), see Supported Data Sources.

        The link configurations depend on the data source. This section describes how to create these links.

        Constraints

        • If changes occur in the connected data source (for example, the MRS cluster capacity is expanded), you need to edit and save the connection.
        • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.
        -

        Prerequisites

        • A CDM cluster is available.
        • The CDM cluster can communicate with the destination data source.
          • If the destination data source is an on-premises database, you need the Internet or Direct Connect. When using the Internet, ensure that an EIP has been bound to the CDM cluster, the security group of CDM allows outbound traffic from the host where the off-cloud data source is located, the host where the data source is located can access the Internet, and the connection port has been enabled in the firewall rules.
          • If the destination data source is a cloud service (such as DWS, MRS, and ECS), the following requirements must be met for network interconnection:
            • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, the host where the data source is located can access the Internet, and the port has been enabled in the firewall rules.
            • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
            • The cloud service instance and the CDM cluster belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
            +

            Prerequisites

            • A CDM cluster is available.
            • The CDM cluster can communicate with the destination data source.
              • If the destination data source is an on-premises database, you need the Internet or Direct Connect. When using the Internet, ensure that an EIP has been bound to the CDM cluster, the security group of CDM allows outbound traffic from the host where the off-cloud data source is located, the host where the data source is located can access the Internet, and the connection port has been enabled in the firewall rules.
              • If the destination data source is a cloud service (such as DWS, MRS, and ECS), the following requirements must be met for network interconnection:
                • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, the host where the data source is located can access the Internet, and the port has been enabled in the firewall rules.
                • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                • The cloud service instance and the CDM cluster belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
              -
            • You have obtained the URL and the account for accessing the data source. The account is granted with the read and write permissions for the data source.
            • When using the Agent, you need to use the main account to grant the CDM operation permission to the sub-account.
            +
          • You have obtained the URL and the account for accessing the data source. The account is granted with the read and write permissions for the data source.
        -

        Creating Links

        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
        2. On the CDM console, choose Cluster Management in the left navigation pane. Locate the row that contains the target cluster and click Job Management in the Operation column. On the displayed Links page, click Create Link. On the displayed page, select a connector.

          The connectors are classified based on the type of the data source to be connected. All supported data types are displayed.

          -
          Figure 1 Selecting a connector type
          +

          Creating Links

          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
          2. On the CDM console, choose Cluster Management in the left navigation pane. Locate the row that contains the target cluster and click Job Management in the Operation column. On the displayed Links page, click Create Link. On the displayed page, select a connector.

            The connectors are classified based on the type of the data source to be connected. All supported data types are displayed.

            +
            Figure 1 Selecting a connector type

          3. Select a data source and click Next. The following describes how to create a MySQL link.

            The link parameters of different data sources vary. Table 1 describes the link parameters.
            @@ -21,62 +21,62 @@ - - - - - - - - - - - - - - - - - - - - - - + + + - @@ -159,7 +166,14 @@
            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0025.html b/docs/dataartsstudio/umn/dataartsstudio_01_0025.html index 76ed24d7d..48bc46aab 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0025.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0025.html @@ -1,8 +1,8 @@

            How Migration Jobs Work

            -

            Data Migration Model

            Figure 1 shows the simplified migration model used by CDM.

            -
            Figure 1 Migration model used by CDM
            +

            Data Migration Model

            Figure 1 shows the simplified migration model used by CDM.

            +
            Figure 1 Migration model used by CDM
            CDM migrates data through data migration jobs. It works in the following way:
            1. When data migration jobs are submitted, CDM splits each job into multiple tasks based on the Concurrent Extractors parameter in the job configuration.

              Jobs for different data sources may be split based on different dimensions. Some jobs may not be split based on the Concurrent Extractors parameter.

            2. CDM submits the tasks to the running pool in sequence. Tasks (defined by Maximum Concurrent Extractors) run concurrently. Excess tasks are queued.
            @@ -74,3 +74,10 @@
            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0026.html b/docs/dataartsstudio/umn/dataartsstudio_01_0026.html index 5647f3a79..ab120dd9f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0026.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0026.html @@ -1,13 +1,14 @@ -

            Link to Hive

            +

            Hive Link Parameters

            CDM supports the following Hive data sources:

            MRS Hive

            You can view a table during field mapping only when you have the permission to access the table connected to MRS Hive.

            MRS Hive links apply to the MapReduce Service (MRS) on cloud. Table 1 describes related parameters.

            -
            • Before creating an MRS Hive link, you need to add an authenticated Kerberos user on MRS and log in to the MRS management page to change the initial password. Then use the new user to create an MRS link.
            • To connect to an MRS 2.x cluster, create a CDM cluster of version 2.x first. CDM 1.8.x clusters cannot connect to MRS 2.x clusters.
            • Currently, the Hive link obtains the core-site.xml configuration information from MRS HDFS. Therefore, if MRS Hive uses OBS as the underlying storage system, configure the AK/SK of OBS on MRS HDFS before creating the Hive link.
            • Ensure that the MRS cluster and the DataArts Studio instance can communicate with each other. The following requirements must be met for network interconnection:
              • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
              • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see Security Group > Adding a Security Group Rule in Virtual Private Cloud (VPC) Usage Guide.
              • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
              +
              • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                +
              • Before creating an MRS Hive link, you need to add an authenticated Kerberos user on MRS and log in to the MRS management page to change the initial password. Then use the new user to create an MRS link.
              • To connect to an MRS 2.x cluster, create a CDM cluster of version 2.x first. CDM 1.8.x clusters cannot connect to MRS 2.x clusters.
              • Currently, the Hive link obtains the core-site.xml configuration information from MRS HDFS. Therefore, if MRS Hive uses OBS as the underlying storage system, configure the AK/SK of OBS on MRS HDFS before creating the Hive link.
              • Ensure that the MRS cluster and the DataArts Studio instance can communicate with each other. The following requirements must be met for network interconnection:
                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
              @@ -28,7 +29,7 @@
            - @@ -77,7 +78,7 @@ - - @@ -343,8 +344,8 @@ @@ -359,7 +360,7 @@ @@ -398,7 +399,14 @@
            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0027.html b/docs/dataartsstudio/umn/dataartsstudio_01_0027.html index d1672dead..af589d236 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0027.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0027.html @@ -1,6 +1,6 @@ -

            Link to CloudTable

            +

            CloudTable Link Parameters

            When connecting CDM to CloudTable, configure the parameters as described in Table 1.

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            @@ -80,7 +80,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0028.html b/docs/dataartsstudio/umn/dataartsstudio_01_0028.html index bc9226973..29442a76d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0028.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0028.html @@ -1,6 +1,6 @@ -

            Link to an FTP or SFTP Server

            +

            FTP/SFTP Link Parameters

            The FTP/SFTP link is used to migrate files from the on-premises file server or ECS to a database.

            • Only FTP servers running Linux are supported.
            • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.
            @@ -48,6 +48,14 @@
            + + + +
            Table 1 Link parameters

            Connector

            • RDS for PostgreSQL
            • RDS for SQL Server
            • PostgreSQL
            • Microsoft SQL Server

            Because the JDBC drivers used by these relational databases are the same, the parameters to be configured are also the same and are described in Link to PostgreSQL/SQLServer.

            +

            Because the JDBC drivers used by these relational databases are the same, the parameters to be configured are also the same and are described in PostgreSQL/SQLServer Link Parameters.

            Data Warehouse Service

            For details about the parameters, see Link to DWS.

            +

            For details about the parameters, see GaussDB(DWS) Link Parameters.

            SAP HANA

            For details about the parameters, see Link to SAP HANA.

            +

            For details about the parameters, see SAP HANA Link Parameters.

            MySQL

            For details about the parameters, see Link to an RDS for MySQL/MySQL Database.

            +

            For details about the parameters, see RDS for MySQL/MySQL Database Link Parameters.

            Oracle

            For details about the parameters, see Link to an Oracle Database.

            +

            For details about the parameters, see Oracle Database Link Parameters.

            Database Sharding

            For details about the parameters, see Link to a Database Shard.

            +

            For details about the parameters, see Shard Link Parameters.

            Object Storage Service (OBS)

            For details about the parameters, see Link to OBS.

            +

            For details about the parameters, see OBS Link Parameters.

            • MRS HDFS
            • FusionInsight HDFS
            • Apache HDFS

            If the data source is HDFS of MRS, Apache Hadoop, or FusionInsight HD, see Link to HDFS.

            +

            If the data source is HDFS of MRS, Apache Hadoop, or FusionInsight HD, see HDFS Link Parameters.

            • MRS HBase
            • FusionInsight HBase
            • Apache HBase

            If the data source is HBase of MRS, Apache Hadoop, or FusionInsight HD, see Link to HBase.

            +

            If the data source is HBase of MRS, Apache Hadoop, or FusionInsight HD, see HBase Link Parameters.

            • MRS Hive
            • FusionInsight Hive
            • Apache Hive

            If the data source is Hive on MRS, Apache Hadoop, or FusionInsight HD, see Link to Hive.

            +

            If the data source is Hive on MRS, Apache Hadoop, or FusionInsight HD, see Hive Link Parameters.

            CloudTable Service

            If the data source is CloudTable, see Link to CloudTable.

            +

            If the data source is CloudTable, see CloudTable Link Parameters.

            • FTP
            • SFTP

            If the data source is an FTP or SFTP server, see Link to an FTP or SFTP Server.

            +

            If the data source is an FTP or SFTP server, see FTP/SFTP Link Parameters.

            HTTP

            @@ -87,58 +87,65 @@

            MongoDB

            If the data source is a local MongoDB, see Link to MongoDB.

            +

            If the data source is a local MongoDB, see MongoDB Link Parameters.

            Document Database Service (DDS)

            If the data source is DDS, see Link to DDS.

            +

            If the data source is DDS, see DDS Link Parameters.

            • Redis
            • Distributed Cache Service

            If the data source is Redis or DCS, see Link to Redis.

            +

            If the data source is Redis or DCS, see Redis Link Parameters.

            • MRS Kafka
            • Apache Kafka

            If the data source is MRS Kafka or Apache Kafka, see Link to Kafka.

            +

            If the data source is MRS Kafka or Apache Kafka, see Kafka Link Parameters.

            Cloud Search Service (CSS)

            Elasticsearch

            If the data source is CSS or Elasticsearch, see Link to CSS.

            +

            If the data source is CSS or Elasticsearch, see CSS Link Parameters.

            Data Lake Insight

            If the data source is DLI, see Link to DLI.

            +

            If the data source is DLI, see DLI Link Parameters.

            DMS Kafka

            If the data source is DMS Kafka, see Link to DMS Kafka.

            +

            If the data source is DMS Kafka, see DMS Kafka Link Parameters.

            Cassandra

            If the data source is Cassandra, see Link to Cassandra.

            +

            If the data source is Cassandra, see Cassandra Link Parameters.

            +
            NOTE:

            Cassandra is not supported in version 2.9.3.300 or later.

            +

            MRS Hudi

            For details about the parameters, see Link to MRS Hudi.

            +

            For details about the parameters, see MRS Hudi Link Parameters.

            MRS ClickHouse

            For details about the parameters, see Link to MRS ClickHouse.

            +

            For details about the parameters, see MRS ClickHouse Link Parameters.

            +

            LogHub (SLS)

            +

            For details about the parameters, see LogHub (SLS) Link Parameters.

            Shentong database

            For details about the parameters, see Link to a ShenTong Database.

            +

            For details about the parameters, see ShenTong Database Link Parameters.

            Manager IP

            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            +
            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            ldapUsername

            This parameter is mandatory when Enable ldap is enabled.

            +

            This parameter is mandatory when Enable ldap is enabled.

            Enter the username configured when LDAP authentication was enabled for MRS Hive.

            -

            @@ -85,7 +86,7 @@

            ldapPassword

            This parameter is mandatory when Enable ldap is enabled.

            +

            This parameter is mandatory when Enable ldap is enabled.

            Enter the password configured when LDAP authentication was enabled for MRS Hive.

            -

            @@ -102,7 +103,7 @@

            This parameter is mandatory when OBS storage support is enabled. The account corresponding to the AK/SK pair must have the OBS Buckets Viewer permission. Otherwise, OBS cannot be accessed and the "403 AccessDenied" error is reported.

            You need to create an access key for the current account and obtain an AK/SK pair.

            -
            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
              Figure 1 Clicking Create Access Key
              +
              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                Figure 1 Clicking Create Access Key
              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                NOTE:
                • Only two access keys can be added for each user.
                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
              @@ -233,8 +234,8 @@

            This parameter is mandatory when OBS storage support is enabled. The account corresponding to the AK/SK pair must have the OBS Buckets Viewer permission. Otherwise, OBS cannot be accessed and the "403 AccessDenied" error is reported.

            You need to create an access key for the current account and obtain an AK/SK pair.

            -
            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
              Figure 2 Clicking Create Access Key
              -
            3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
              NOTE:
              • Only two access keys can be added for each user.
              • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
              +
              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 2.
                Figure 2 Clicking Create Access Key
                +
              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                NOTE:
                • Only two access keys can be added for each user.
                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.

            This parameter is mandatory when OBS storage support is enabled. The account corresponding to the AK/SK pair must have the OBS Buckets Viewer permission. Otherwise, OBS cannot be accessed and the "403 AccessDenied" error is reported.

            You need to create an access key for the current account and obtain an AK/SK pair.

            -
            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
              Figure 3 Clicking Create Access Key
              -
            3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
              NOTE:
              • Only two access keys can be added for each user.
              • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
              +
              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                Figure 3 Clicking Create Access Key
                +
              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                NOTE:
                • Only two access keys can be added for each user.
                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.

            Run Mode

            This parameter is used only when the Hive version is HIVE_3_X. Possible values are:

            -
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • Standalone: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, Standalone prevails.
              NOTE:

              The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              +
              • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
              • Standalone: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, Standalone prevails.
                NOTE:

                The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

            -

            FTP File Name controlEncoding

            +

            This parameter is available for a FTP link.

            +

            It indicates the controlEncoding file name encoding configuration of ftp-client. The value can be ISO-8859-1 or UFT8. The default value is ISO-8859-1.

            +

            ISO-8859-1

            +
            @@ -55,7 +63,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0030.html b/docs/dataartsstudio/umn/dataartsstudio_01_0030.html index 674abaefe..fdd9b05b9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0030.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0030.html @@ -1,9 +1,9 @@ -

            Link to MongoDB

            +

            MongoDB Link Parameters

            This link is used to transfer data from a third-party cloud MongoDB service or MongoDB created in the on-premises data center or ECS to a big data platform.

            When connecting CDM to an on-premises MongoDB database, configure the parameters as described in Table 1.

            -

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            +
            • MongoDB data sources with SSL enabled are not supported.
            • Do not change the password or user when a job is running. If you do so, the password will not take effect immediately and the job will fail.
            - @@ -136,7 +136,7 @@ - @@ -222,7 +222,7 @@ - @@ -120,7 +120,7 @@ - @@ -207,7 +207,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0050.html b/docs/dataartsstudio/umn/dataartsstudio_01_0050.html index a6ffc3a21..c79d36902 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0050.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0050.html @@ -22,7 +22,7 @@ @@ -50,8 +52,8 @@ - @@ -105,7 +105,7 @@ - @@ -173,7 +173,7 @@ - - + + + +
            Table 1 MongoDB link parameters

            Parameter

            @@ -72,7 +72,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0031.html b/docs/dataartsstudio/umn/dataartsstudio_01_0031.html index 41f19f56c..c91717417 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0031.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0031.html @@ -1,9 +1,9 @@ -

            Link to DDS

            +

            DDS Link Parameters

            The DDS link is used to synchronize data from Document Database Service (DDS) on the cloud to a big data platform.

            When connecting CDM to DDS, configure the parameters as described in Table 1.

            -

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            +
            • DDS data sources with SSL enabled are not supported.
            • Do not change the password or user when a job is running. If you do so, the password will not take effect immediately and the job will fail.
            - @@ -64,9 +64,9 @@
            Table 1 DDS link parameters

            Parameter

            @@ -64,7 +64,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0032.html b/docs/dataartsstudio/umn/dataartsstudio_01_0032.html index 7b512ccdf..cc0f8ff42 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0032.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0032.html @@ -1,6 +1,6 @@ -

            Link to Redis

            +

            Redis Link Parameters

            The Redis link is applicable to data migration of Redis created in the local data center or ECS. It is used to load data in the database or files to Redis.

            Links to Redis data encrypted using SSL are not supported.

            When connecting CDM to an on-premises Redis database, configure the parameters as described in Table 1.

            @@ -84,7 +84,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0033.html b/docs/dataartsstudio/umn/dataartsstudio_01_0033.html index 428c4e94d..8e04cac37 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0033.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0033.html @@ -1,6 +1,6 @@ -

            Link to Kafka

            +

            Kafka Link Parameters

            MRS Kafka

            When connecting CDM to Kafka of MRS, configure the parameters as described in Table 1.

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            @@ -22,7 +22,7 @@

            Manager IP

            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            +
            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            - - @@ -92,7 +92,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0035.html b/docs/dataartsstudio/umn/dataartsstudio_01_0035.html index 3110c2d36..fb3ca8f78 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0035.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0035.html @@ -1,6 +1,6 @@ -

            Link to CSS

            +

            CSS Link Parameters

            Cloud Search Service (CSS) is a fully hosted distributed search service powered by open-source Elasticsearch. CSS links can be used to migrate log files and database records to CSS for search and analysis using Elasticsearch.

            • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.
            @@ -52,7 +52,7 @@
            - @@ -63,7 +63,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0036.html b/docs/dataartsstudio/umn/dataartsstudio_01_0036.html index 40a243425..9b2b8dd5a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0036.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0036.html @@ -1,8 +1,9 @@ -

            Link to DLI

            +

            DLI Link Parameters

            When connecting CDM to DLI, configure the parameters as described in Table 1.

            -

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            +
            • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

              +
            • When data is migrated to DLI, DLI generates data files in the dli-trans* temporary OBS bucket. Therefore, you need to grant the user who uses the AK/SK the permissions to read and write the dli-trans* bucket and create directories. Otherwise, the migration will fail. For details about how to add permission policies for temporary bucket dli-trans*, see Adding an Authorization Policy for the dli-trans* Temporary Bucket.
            Table 2 Parameter description

            Parameter

            Description

            +

            Description

            Example Value

            +

            Example Value

            HTTPS Access

            This parameter is displayed when Security Mode Authentication is set to Yes. This parameter specifies whether to enable HTTPS access. HTTPS access is more secure than HTTP access.

            +

            This parameter is displayed when Security Mode Authentication is set to Yes. This parameter specifies whether to enable HTTPS access. HTTPS access is more secure than HTTP access.

            Yes

            + + + +
            Table 1 DLI link parameters

            Parameter

            @@ -24,7 +25,7 @@

            AK/SK required for authentication during access to the DLI database.

            You need to create an access key for the current account and obtain an AK/SK pair.

            -
            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
              Figure 1 Clicking Create Access Key
              +
              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                Figure 1 Clicking Create Access Key
              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                NOTE:
                • Only two access keys can be added for each user.
                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
              @@ -40,19 +41,110 @@

            Project ID

            Project ID in the region where DLI resides

            -
            A project is a group of tenant resources, and an account ID corresponds to the current account. The IAM ID corresponds to the current user. You can view the project IDs, account IDs, and user IDs in different regions on the corresponding pages.
            1. Register with and log in to the management console.
            2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
            3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project ID from the project list.
            +
            A project is a group of tenant resources, and an account ID corresponds to the current account. The IAM ID corresponds to the current user. You can view the project IDs, account IDs, and user IDs in different regions on the corresponding pages.
            1. Register with and log in to the management console.
            2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
            3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project and its ID from the project list.

            -

            Batch Size

            +

            Number of rows written each time. When the number of rows written reaches the value of Commit Size, the rows will be committed to the database.

            +

            50000

            +
            +

            Adding an Authorization Policy for the dli-trans* Temporary Bucket

            1. Log in to the IAM console.
            2. In the navigation pane, choose Permissions > Policies/Roles and click Create Custom Policy in the upper right corner.

              Figure 2 Creating a custom policy
              +

            3. On the Create Custom Policy page, select JSON for Policy View and create custom policy obs_dli-trans.

              {
              +    "Version": "1.1",
              +    "Statement": [
              +        {
              +            "Effect": "Allow",
              +            "Action": [
              +                "obs:object:GetObject",
              +                "obs:object:DeleteObjectVersion",
              +                "obs:bucket:GetBucketLocation",
              +                "obs:object:GetAccessLabel",
              +                "obs:bucket:PutEncryptionConfiguration",
              +                "obs:bucket:PutBucketStoragePolicy",
              +                "obs:object:DeleteAccessLabel",
              +                "obs:bucket:PutBucketCustomDomainConfiguration",
              +                "obs:bucket:GetLifecycleConfiguration",
              +                "obs:bucket:PutBucketInventoryConfiguration",
              +                "obs:bucket:DeleteDirectColdAccessConfiguration",
              +                "obs:object:AbortMultipartUpload",
              +                "obs:bucket:PutBucketLogging",
              +                "obs:bucket:DeleteBucketWebsite",
              +                "obs:object:DeleteObject",
              +                "obs:bucket:PutBucketVersioning",
              +                "obs:bucket:GetBucketWebsite",
              +                "obs:bucket:GetBucketLogging",
              +                "obs:bucket:DeleteBucketCustomDomainConfiguration",
              +                "obs:object:PutObject",
              +                "obs:object:RestoreObject",
              +                "obs:bucket:PutReplicationConfiguration",
              +                "obs:bucket:GetBucketQuota",
              +                "obs:object:GetObjectVersionAcl",
              +                "obs:bucket:DeleteBucket",
              +                "obs:bucket:CreateBucket",
              +                "obs:bucket:GetDirectColdAccessConfiguration",
              +                "obs:bucket:PutDirectColdAccessConfiguration",
              +                "obs:bucket:GetBucketAcl",
              +                "obs:bucket:GetBucketVersioning",
              +                "obs:bucket:GetBucketInventoryConfiguration",
              +                "obs:bucket:GetBucketStoragePolicy",
              +                "obs:bucket:GetEncryptionConfiguration",
              +                "obs:bucket:PutBucketCORS",
              +                "obs:bucket:PutBucketTagging",
              +                "obs:bucket:GetBucketTagging",
              +                "obs:bucket:PutLifecycleConfiguration",
              +                "obs:bucket:GetBucketCustomDomainConfiguration",
              +                "obs:object:ListMultipartUploadParts",
              +                "obs:object:ModifyObjectMetaData",
              +                "obs:bucket:ListBucketVersions",
              +                "obs:bucket:PutBucketQuota",
              +                "obs:object:PutAccessLabel",
              +                "obs:bucket:ListBucket",
              +                "obs:bucket:GetBucketCORS",
              +                "obs:bucket:DeleteBucketInventoryConfiguration",
              +                "obs:object:GetObjectVersion",
              +                "obs:bucket:PutBucketWebsite",
              +                "obs:bucket:DeleteReplicationConfiguration",
              +                "obs:object:GetObjectAcl",
              +                "obs:bucket:GetBucketNotification",
              +                "obs:bucket:PutBucketNotification",
              +                "obs:bucket:GetReplicationConfiguration",
              +                "obs:bucket:GetBucketPolicy",
              +                "obs:bucket:DeleteBucketTagging",
              +                "obs:bucket:GetBucketStorage"
              +            ],
              +            "Resource": [
              +                "OBS:*:*:object:*",
              +                "OBS:*:*:bucket:dli-trans*"
              +            ]
              +        }
              +    ]
              +}
              +
              Figure 3 Creating custom policy obs_dli-trans
              +

              +

            4. Click OK.
            5. In the navigation pane, choose User Groups, locate the user group to which the DLI link user using the AK/SK belongs, and click Authorize to assign the custom obs_dli-trans policy to the user.

              Figure 4 Assigning the custom obs_dli-trans policy to a user group
              +

              +

            +
            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0037.html b/docs/dataartsstudio/umn/dataartsstudio_01_0037.html index 591b9ebb8..419955d29 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0037.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0037.html @@ -1,6 +1,6 @@ -

            Link to CloudTable OpenTSDB

            +

            CloudTable OpenTSDB Link Parameters

            When connecting CDM to CloudTable OpenTSDB, configure the parameters as described in Table 1.

            - @@ -149,7 +153,7 @@ - - @@ -274,7 +278,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0040.html b/docs/dataartsstudio/umn/dataartsstudio_01_0040.html index 033b4fd7a..8980eb24b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0040.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0040.html @@ -1,12 +1,16 @@ -

            Link to HDFS

            +

            HDFS Link Parameters

            CDM supports the following HDFS data sources:

            MRS HDFS

            When connecting CDM to HDFS of MRS, configure the parameters as described in Table 1.

            -
            • Before creating an MRS link, you need to add an authenticated Kerberos user on MRS and log in to the MRS management page to change the initial password. Then use the new user to create an MRS link.
            • To connect to an MRS 2.x cluster, create a CDM cluster of version 2.x first. CDM 1.8.x clusters cannot connect to MRS 2.x clusters.
            • If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
              • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
              • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
              • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
              +
              • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                +
              • Before creating an MRS link, you need to add an authenticated Kerberos user on MRS and log in to the MRS management page to change the initial password. Then use the new user to create an MRS link.
              • To connect to an MRS 2.x cluster, create a CDM cluster of version 2.x first. CDM 1.8.x clusters cannot connect to MRS 2.x clusters.
              • If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                +

                If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                +
                +
              @@ -27,7 +31,7 @@
            - @@ -61,17 +65,17 @@ - - @@ -159,8 +163,8 @@ - - @@ -227,8 +231,8 @@ - - @@ -272,7 +276,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0044.html b/docs/dataartsstudio/umn/dataartsstudio_01_0044.html index 9b7344f9c..e07473d23 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0044.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0044.html @@ -1,7 +1,7 @@ -

            Link to PostgreSQL/SQLServer

            -

            Table 1 lists the parameters for creating a link to PostgreSQL/SQLServer.

            +

            PostgreSQL/SQLServer Link Parameters

            +

            Table 1 lists the parameters for creating a link to PostgreSQL/SQLServer. Greenplum, Kingbase, and GaussDB can be connected through the PostgreSQL connector. The source and destination data sources supported by migration jobs are the same as those for PostgreSQL.

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            @@ -60,16 +60,31 @@
            - - - - + + + + + + + + + + + + + + + + - - - @@ -109,7 +140,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0045.html b/docs/dataartsstudio/umn/dataartsstudio_01_0045.html index e2d990928..465407c8c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0045.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0045.html @@ -1,6 +1,6 @@ -

            Link to OBS

            +

            OBS Link Parameters

            When connecting CDM to the destination OBS bucket, you need to add the read and write permissions to the destination OBS bucket, and file authentication is not required.

            • If the CDM cluster and OBS bucket are not in the same region, the CDM cluster cannot access the OBS bucket.
            • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.
            @@ -27,7 +27,7 @@
            NOTE:
            • If the CDM cluster and OBS bucket are not in the same region, the CDM cluster cannot access the OBS bucket.
            • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.
            -
            + + + +
            Table 1 CloudTable OpenTSDB link parameters

            Parameter

            @@ -36,7 +36,7 @@

            Project ID

            Project ID in the region where CloudTable resides

            -
            A project is a group of tenant resources, and an account ID corresponds to the current account. The IAM ID corresponds to the current user. You can view the project IDs, account IDs, and user IDs in different regions on the corresponding pages.
            1. Register with and log in to the management console.
            2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
            3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project ID from the project list.
            +
            A project is a group of tenant resources, and an account ID corresponds to the current account. The IAM ID corresponds to the current user. You can view the project IDs, account IDs, and user IDs in different regions on the corresponding pages.
            1. Register with and log in to the management console.
            2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
            3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project and its ID from the project list.

            -

            @@ -53,7 +53,7 @@

            AK and SK for accessing CloudTable.

            You need to create an access key for the current account and obtain an AK/SK pair.

            -
            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
              Figure 1 Clicking Create Access Key
              +
              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                Figure 1 Clicking Create Access Key
              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                NOTE:
                • Only two access keys can be added for each user.
                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
              @@ -72,7 +72,14 @@
              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0038.html b/docs/dataartsstudio/umn/dataartsstudio_01_0038.html index 585921cfe..b16f140ce 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0038.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0038.html @@ -1,6 +1,6 @@ -

              Link to DMS Kafka

              +

              DMS Kafka Link Parameters

              When connecting CDM to DMS Kafka, configure the parameters as described in Table 1.

              Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

              @@ -72,7 +72,7 @@
              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0039.html b/docs/dataartsstudio/umn/dataartsstudio_01_0039.html index 6c6de3cfa..05aa23976 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0039.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0039.html @@ -1,12 +1,16 @@ -

              Link to HBase

              +

              HBase Link Parameters

              CDM supports the following HBase data sources:

              MRS HBase

              When connecting CDM to HBase of MRS, configure the parameters as described in Table 1.

              -
              • Before creating an MRS link, you need to add an authenticated Kerberos user on MRS and log in to the MRS management page to change the initial password. Then use the new user to create an MRS link.
              • To connect to an MRS 2.x cluster, create a CDM cluster of version 2.x first. CDM 1.8.x clusters cannot connect to MRS 2.x clusters.
              • If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                +
                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                  +
                • Before creating an MRS link, you need to add an authenticated Kerberos user on MRS and log in to the MRS management page to change the initial password. Then use the new user to create an MRS link.
                • To connect to an MRS 2.x cluster, create a CDM cluster of version 2.x first. CDM 1.8.x clusters cannot connect to MRS 2.x clusters.
                • If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                  • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                  • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                  • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                  +

                  If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                  +
                  +
                @@ -27,7 +31,7 @@

            Manager IP

            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            +
            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            Authentication Method

            Authentication method used for accessing the cluster:
            • SIMPLE: Select this for non-security mode.
            • KERBEROS: Select this for security mode.
            +
            Authentication method used for accessing the cluster:
            • SIMPLE: Select this for non-security mode.
            • KERBEROS: Select this for security mode.

            Kerberos

            @@ -219,7 +223,7 @@

            Authentication Method

            Authentication method used for accessing the cluster:
            • SIMPLE: Select this for non-security mode.
            • KERBEROS: Select this for security mode.
            +
            Authentication method used for accessing the cluster:
            • SIMPLE: Select this for non-security mode.
            • KERBEROS: Select this for security mode.

            Kerberos

            @@ -244,7 +248,7 @@

            Run Mode

            Run mode of the HBase link. This parameter is used only when the HBase version is HBASE_2_X.

            -
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • Standalone: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, Standalone prevails.
              NOTE:

              The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              +
              • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
              • Standalone: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, Standalone prevails.
                NOTE:

                The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

            Manager IP

            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            +
            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
            NOTE:

            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

            Run Mode

            Run mode of the HDFS link. The options are as follows:
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • STANDALONE: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, select STANDALONE or configure different agents.

              Note: The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              -
            • Agent: The link instance runs on an agent.
            +
            Run mode of the HDFS link. The options are as follows:
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • STANDALONE: The link instance runs in an independent process. If you want to connect CDM to multiple Hadoop data sources (MRS, Hadoop, or CloudTable), and both KERBEROS and SIMPLE authentication modes are available, you must select STANDALONE for this parameter.

              Note: The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              +
            -

            If Agent is not used, and the CDM cluster connects to two or more clusters with Kerberos authentication enabled and the same realm, only one cluster can be connected in EMBEDDED mode, and the other clusters must be in STANDALONE mode.

            +

            If a CDM cluster connects to two or more clusters with Kerberos authentication enabled and the same realm, only one cluster can be connected in EMBEDDED mode, and the other clusters must be connected in STANDALONE mode.

            STANDALONE

            Agent

            Click Select and select the agent created in Connecting to an Agent. This parameter is displayed when Run Mode is set to Agent.

            +

            The agent function will be unavailable soon and does not need to be configured.

            -

            Run Mode

            Run mode of the HDFS link. The options are as follows:
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • STANDALONE: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, select STANDALONE or configure different agents.

              Note: The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              -
            • Agent: The link instance runs on an agent.
            +
            Run mode of the HDFS link. The options are as follows:
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • STANDALONE: The link instance runs in an independent process. If you want to connect CDM to multiple Hadoop data sources (MRS, Hadoop, or CloudTable), and both KERBEROS and SIMPLE authentication modes are available, you must select STANDALONE for this parameter.

              Note: The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              +

            STANDALONE

            @@ -168,7 +172,7 @@

            Agent

            Click Select and select the agent created in Connecting to an Agent. This parameter is displayed when Run Mode is set to Agent.

            +

            The agent function will be unavailable soon and does not need to be configured.

            -

            Run Mode

            Run mode of the HDFS link. The options are as follows:
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • STANDALONE: The link instance runs in an independent process. If CDM needs to connect to multiple Hadoop data sources (MRS, Hadoop, or CloudTable) with both Kerberos and Simple authentication modes, select STANDALONE or configure different agents.

              Note: The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              -
            • Agent: The link instance runs on an agent. For Apache HDFS, you can select Agent only if Authentication Method is set to SIMPLE.
            +
            Run mode of the HDFS link. The options are as follows:
            • EMBEDDED: The link instance runs with CDM. This mode delivers better performance.
            • STANDALONE: The link instance runs in an independent process. If you want to connect CDM to multiple Hadoop data sources (MRS, Hadoop, or CloudTable), and both KERBEROS and SIMPLE authentication modes are available, you must select STANDALONE for this parameter.

              Note: The STANDALONE mode is used to solve the version conflict problem. If the connector versions of the source and destination ends of the same link are different, a JAR file conflict occurs. In this case, you need to place the source or destination end in the STANDALONE process to prevent the migration failure caused by the conflict.

              +

            STANDALONE

            @@ -245,7 +249,7 @@

            Agent

            This parameter is required when Authentication Method is set to SIMPLE and Run Mode is set to Agent. Select the agent created in Connecting to an Agent.

            +

            The agent function will be unavailable soon and does not need to be configured.

            -

            Use Agent

            Whether to extract data from the data source through an agent

            +

            The agent function will be unavailable soon and does not need to be configured.

            Yes

            +

            -

            Agent

            Click Select and select the agent created in Managing Agents.

            +

            The agent function will be unavailable soon and does not need to be configured.

            -

            +

            -

            +

            Driver Class Name

            +

            Class name of the uploaded driver

            +

            Select org.postgresql.Driver or com.kingbase8.Driver.

            +

            -

            +

            Reference Sign

            +

            (Optional) Delimiter between the names of the referenced tables or columns. For details, see the product documentation of the corresponding database.

            +

            "

            Driver Version

            @@ -87,20 +102,36 @@

            1000

            Commit Size

            +

            (Optional) Displayed when you click Show Advanced Attributes.

            +

            Number of records submitted each time. Set this parameter based on the destination and data size of the job. If the value is too large or too small, the job execution time may be affected.

            +

            10000

            +

            SSL Encryption

            +

            Whether to connect to the database in SSL mode

            +

            Yes

            +

            Link Attributes

            (Optional) Click Add to add the JDBC connector attributes of multiple specified data sources. For details, see the JDBC connector document of the corresponding database.

            -
            The following are some examples:
            • connectTimeout=60 and socketTimeout=300: When a large amount of data needs to be migrated or the entire table is retrieved using query statements, the migration fails due to connection timeout. In this case, you can customize the connection timeout interval (s) and socket timeout interval (s) to prevent failures caused by timeout.
            • useCursorFetch=false: By default, useCursorFetch is enabled, indicating that the JDBC connector communicates with relational databases using a binary protocol. Some third-party systems may have compatibility issues, causing migration time conversion errors. In this case, you can disable this function.
            • trustServerCertificate=true: A PKIX error may be reported during the creation of a secure connection. You are advised to set this parameter to true.
            +
            The following are some examples:
            • connectTimeout=60 and socketTimeout=300: When a large amount of data needs to be migrated or the entire table is retrieved using query statements, the migration fails due to connection timeout. In this case, you can customize the connection timeout interval (s) and socket timeout interval (s) to prevent failures caused by timeout.
            • useCursorFetch=false: By default, useCursorFetch is enabled, indicating that the JDBC connector communicates with relational databases using a binary protocol. Some third-party systems may have compatibility issues, causing migration time conversion errors. In this case, you can disable this function.
            • trustServerCertificate=true: A PKIX error may be reported during the creation of a secure connection. You are advised to set this parameter to true.
            • sslmode=require: The link to PostgreSQL may fail when SSL authentication is enabled. Set this parameter to require.

            sslmode=require

            Reference Sign

            +

            Link Secret Attributes

            (Optional) Delimiter between the names of the referenced tables or columns. For details, see the product documentation of the corresponding database.

            +

            (Optional) Displayed when you click Show Advanced Attributes.

            +

            Custom secret attributes of the link

            "

            +

            sk=09fUgD5WOF1L6f

            -

            +

            obs.myregion.mycloud.com

            Port

            @@ -48,7 +48,7 @@

            AK and SK are used to log in to the OBS server.

            You need to create an access key for the current account and obtain an AK/SK pair.

            -
            To obtain an access key, perform the following steps:
            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
              Figure 1 Clicking Create Access Key
              +
              To obtain an access key, perform the following steps:
              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                Figure 1 Clicking Create Access Key
              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                NOTE:
                • Only two access keys can be added for each user.
                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
              @@ -62,6 +62,17 @@

            -

            Link Attributes

            +

            (Optional) Displayed when you click Show Advanced Attributes.

            +

            You can click Add to add custom attributes for the link.

            +

            Only connectionTimeout, socketTimeout, and idleConnectionTime are supported.

            +

            The following are some examples:

            +
            • socketTimeout: timeout interval for data transmission at the socket layer, in milliseconds
            • connectionTimeout: timeout interval for establishing an HTTP/HTTPS connection, in milliseconds
            +

            -

            +
            @@ -69,7 +80,14 @@
            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_004501.html b/docs/dataartsstudio/umn/dataartsstudio_01_004501.html index a09a208aa..758110eba 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_004501.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_004501.html @@ -1,7 +1,7 @@ -

            Link to Cassandra

            -

            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

            +

            Cassandra Link Parameters

            +
            • Cassandra is not supported in version 2.9.3.300 or later.
            • Do not change the password or user when a job is running. If you do so, the password will not take effect immediately and the job will fail.
            - @@ -155,6 +157,13 @@ + + + + @@ -264,18 +275,19 @@

          4. After the parameters are configured, click Next. The Map Field tab page is displayed.

            If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.

            In other scenarios, CDM automatically maps fields of the source table and the destination table. You need to check whether the mapping and time format are correct. For example, check whether the source field type can be converted into the destination field type.

            -
            Figure 2 Field mapping
            -
            • If the fields from the source and destination do not match, you can drag the fields to make adjustments.
            • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, or when data is migrated from SFTP/FTP to DLI, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
            • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
            • On the Map Field page, you can click to add custom constants, variables, and expressions.
            • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
            • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datatime) so that they can be written.
            • When Hive serves as the source, data of the array and map types can be read.
            • Field mapping is not involved when the binary format is used to migrate files to files.
            • If the data is imported to DWS, you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following principles:
              1. Use the primary key as the distribution column.
              2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
              3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
              +
              Figure 2 Field mapping
              +
              • If the fields from the source and destination do not match, you can drag the fields to make adjustments.
              • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, or when data is migrated from SFTP/FTP to DLI, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
              • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
              • On the Map Field page, you can click to add custom constants, variables, and expressions.
              • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
              • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datatime) so that they can be written.
              • When Hive serves as the source, data of the array and map types can be read.
              • Field mapping is not involved when the binary format is used to migrate files to files.
              • If the data is imported to DWS, you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following principles:
                1. Use the primary key as the distribution column.
                2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
                3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
              -

            • CDM supports field conversion. Click and then click Create Converter.

              Figure 3 Creating a converter
              +

            • CDM supports field conversion. Click and then click Create Converter.

              Figure 3 Creating a converter
              +

              CDM supports the following converters:

              • Anonymization: hides key data in the character string.
                For example, if you want to convert 12345678910 to 123****8910, configure the parameters as follows:
                • Set Reserve Start Length to 3.
                • Set Reserve End Length to 4.
                • Set Replace Character to *.
              • Trim automatically deletes the spaces before and after the character string.
              • Reverse string automatically reverses a character string. For example, reverse ABC into CBA.
              • Replace string replaces the specified character string.
              • Expression conversion uses the JSP expression language (EL) to convert the current field or a row of data.
              • Remove line break deletes the newline characters, such as \n, \r, and \r\n from the field.

              If Use SQL Statement is set to Yes in the source job configuration, converters cannot be created.

              -

            • Click Next, set job parameters, and click Show Advanced Attributes to display and configure optional parameters.

              Figure 4 Task parameters
              +

            • Click Next, set job parameters, and click Show Advanced Attributes to display and configure optional parameters.

              Figure 4 Task parameters
              Table 3 describes related parameters.
          5. Table 1 Parameter description

            Parameter

            @@ -69,7 +69,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0046.html b/docs/dataartsstudio/umn/dataartsstudio_01_0046.html index ee5b2e959..649ec8e99 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0046.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0046.html @@ -5,9 +5,9 @@

            Constraints

            • The dirty data recording function depends on OBS.
            • The JSON file of a job to be imported cannot exceed 1 MB.
            • The size of a file to be transferred cannot exceed 1 TB.
            • Field names of the source and destination parameters cannot contain ampersands (&) or number signs (%).
            -

            Prerequisites

            • A link has been created. For details, see Creating Links.
            • The CDM cluster can communicate with the data source.
            +

            Prerequisites

            -

            Procedure

            1. Log in to the management console and choose Service List > Cloud Data Migration. In the left navigation pane, choose Cluster Management. Locate the target cluster and click Job Management.
            2. Choose Table/File Migration > Create Job. The page for configuring the job is displayed.

              Figure 1 Creating a migration job
              +

              Procedure

              1. Log in to the management console and choose Service List > Cloud Data Migration. In the left navigation pane, choose Cluster Management. Locate the target cluster and click Job Management.
              2. Choose Table/File Migration > Create Job. The page for configuring the job is displayed.

                Figure 1 Creating a migration job

              3. Select the source and destination links.

                • Job Name: Enter a string consisting of 1 to 240 characters. The name can contain digits, letters, hyphens (-), underscores (_), and periods (.), and cannot start with a hyphen (-) or period (.). An example value is oracle2rds_t.
                • Source Link Name: Select the data source from which data will be exported.
                • Destination Link Name: Select the data source to which data will be imported.

              4. Configure the source link parameters.

                The parameters vary with data sources. For details about the job parameters of other types of data sources, see Table 1 and Table 2.

                @@ -52,7 +52,7 @@

            Data can be exported from DLI.

            For details, see From DLI.

            +

            For details, see From DLI.

            • FTP
            • SFTP
            @@ -116,6 +116,8 @@
            • MongoDB
            • Document Database Service

            Data can be exported from MongoDB or DDS.

            +
            NOTE:

            MongoDB and DDS data sources with SSL enabled are not supported.

            +

            For details, see From MongoDB/DDS.

            For details, see From MRS ClickHouse.

            LogHub (SLS)

            +

            Data can be exported from LogHub (SLS).

            +

            For details, see From LogHub (SLS).

            +

            ShenTong database

            Data can be exported from a ShenTong database.

            @@ -255,6 +264,8 @@

            MongoDB

            Data can be rapidly imported to MongoDB.

            +
            NOTE:

            MongoDB data sources with SSL enabled are not supported.

            +

            For details, see To MongoDB.

            @@ -304,7 +316,7 @@ - @@ -313,7 +325,9 @@ - - @@ -378,7 +392,7 @@ - - - + + + +
            Table 3 Parameter description

            Parameter

            Schedule Execution

            If you select Yes, you can set the start time, cycle, and validity period of a job. For details, see Scheduling Job Execution.

            +

            If you select Yes, you can set the start time, cycle, and validity period of a job. For details, see Configuring a Scheduled CDM Job.

            NOTE:

            If you use DataArts Studio DataArts Factory to schedule the CDM migration job and configure this parameter, both configurations take effect. To ensure unified service logic and avoid scheduling conflicts, enable job scheduling in DataArts Factory and do not configure a scheduled task for the job in DataArts Migration.

            Concurrent Extractors

            Configure the number of tasks to be split from a CDM job.

            +

            Maximum number of threads of the job for reading data from the source

            +
            NOTE:

            The number of concurrent threads may be less than or equal to the value of this parameter for some data sources that do not support concurrent extraction, for example, CSS and ClickHouse.

            +
            CDM migrates data through data migration jobs. It works in the following way:
            1. When data migration jobs are submitted, CDM splits each job into multiple tasks based on the Concurrent Extractors parameter in the job configuration.
              NOTE:

              Jobs for different data sources may be split based on different dimensions. Some jobs may not be split based on the Concurrent Extractors parameter.

            2. CDM submits the tasks to the running pool in sequence. Tasks (defined by Maximum Concurrent Extractors) run concurrently. Excess tasks are queued.
            @@ -369,7 +383,7 @@

            Dirty Data Directory

            This parameter is displayed only when Write Dirty Data is set to Yes.

            +

            This parameter is displayed only when Write Dirty Data is set to Yes.

            Dirty data is stored in the directory for storing dirty data on OBS. Dirty data is saved only when this parameter is configured.

            You can go to this directory to query data that fails to be processed or is filtered out during job execution, and check the source data that does not meet conversion or cleaning rules.

            Max. Error Records in a Single Shard

            This parameter is displayed only when Write Dirty Data is set to Yes.

            +

            This parameter is displayed only when Write Dirty Data is set to Yes.

            When the number of error records of a single map exceeds the upper limit, the job will automatically terminate and the imported data cannot be rolled back. You are advised to use a temporary table as the destination table. After the data is imported, rename the table or combine it into the final data table.

            0

            @@ -393,20 +407,29 @@

            Yes

            Max. error records in a single shard

            +

            byteRate(MB/s)

            Maximum rate for a job. To configure throttling for multiple jobs, multiply the rate by the number of concurrent jobs.

            +

            Maximum read/write speed of the job

            +

            Throttling can be enabled for a job for migrating data to Hive, DLI, JDBC, OBS, or HDFS. If multiple concurrent jobs are allowed, the actual maximum speed can be calculated by the value of this parameter multiplied by the number of concurrent jobs.

            NOTE:

            The rate is an integer greater than 1.

            20

            Intermediate Queue Cache Size (MB)

            +

            Amount of data that the intermediate queue can cache. The value ranges from 1 to 500. The default value is 64.

            +

            If the amount of data of a row exceeds the value of this parameter, the migration may fail. If the value of this parameter is too large, the cluster may not run properly. Set an appropriate value for this parameter and use the default value (64) unless otherwise specified.

            +

            64

            +
            -

          6. Click Save or Save and Run. On the page displayed, you can view the job status.

            The job status can be New, Pending, Booting, Running, Failed, Succeeded, or Stopped.

            +

          7. Click Save or Save and Run. On the displayed page, you can view the job status.

            The job status can be New, Pending, Booting, Running, Failed, Succeeded, or Stopped.

            Pending indicates that the job is waiting to be scheduled by the system, and Booting indicates that the data to be migrated is being analyzed.

          8. @@ -414,7 +437,14 @@
            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0047.html b/docs/dataartsstudio/umn/dataartsstudio_01_0047.html index ab2c4066f..971b697a1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0047.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0047.html @@ -1,6 +1,6 @@ -

            Source Job Parameters

            +

            Configuring CDM Source Job Parameters

            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0048.html b/docs/dataartsstudio/umn/dataartsstudio_01_0048.html index 17f385050..c5f564994 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0048.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0048.html @@ -29,7 +29,7 @@

            Directory or file path from which data will be extracted. You can enter a maximum of 50 file paths. By default, the file paths are separated by vertical bars (|). You can also customize a file separator.

            Directory from which data is to be migrated. All files (including all nested subdirectories and their subfiles) in the directory will be migrated.

            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            FROM/example.csv

            @@ -77,7 +77,7 @@

            JSON Type

            This parameter is displayed only when File Format is set to JSON. Type of a JSON object stored in a JSON file. The options are JSON object and JSON array.

            +

            This parameter is displayed only when File Format is set to JSON. Type of a JSON object stored in a JSON file. The options are JSON object and JSON array.

            JSON object

            Use First N Rows as Header

            This parameter is displayed only when File Format is set to CSV. When you migrate a CSV file to a table, CDM writes all data to the table by default. If you set this parameter to Yes, CDM uses the first N rows of the CSV file as the heading row and does not write the row to the destination table.

            +

            This parameter is displayed only when File Format is set to CSV. When you migrate a CSV file to a table, CDM writes all data to the table by default. If you set this parameter to Yes, CDM uses the first N rows of the CSV file as the heading row and does not write the row to the destination table.

            No

            Directory Filter

            If you set Filter Type to Wildcard or Regex, enter a wildcard character to filter paths. The paths that meet the filtering condition are migrated. You can configure multiple paths separated by commas (,).

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            *input

            @@ -231,7 +231,7 @@

            File Filter

            If you set Filter Type to Wildcard or Regex, you can enter a wildcard character to search for files in a specified path. The files that meet the search criteria are migrated. You can configure multiple files separated by commas (,).

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            *.csv,*.txt

            @@ -248,7 +248,7 @@

            If you set Filter Type to Time Filter, and specify a point in time for this parameter, only the files modified at or after the specified time are transferred. The time format must be yyyy-MM-dd HH:mm:ss.

            This parameter can be set to a macro variable of date and time. For example, ${timestamp(dateformat(yyyy-MM-dd HH:mm:ss,-90,DAY))} indicates that only files generated within the latest 90 days are migrated.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-06-01 00:00:00

            @@ -258,7 +258,7 @@

            If you set Filter Type to Time Filter, and specify a point in time for this parameter, only the files modified before the specified time are transferred. The time format must be yyyy-MM-dd HH:mm:ss.

            This parameter can be set to a macro variable of date and time. For example, ${timestamp(dateformat(yyyy-MM-dd HH:mm:ss))} indicates that only the files whose modification time is earlier than the current time are migrated.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-07-01 00:00:00

            @@ -288,7 +288,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0049.html b/docs/dataartsstudio/umn/dataartsstudio_01_0049.html index 8d45b002c..07243fabf 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0049.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0049.html @@ -28,7 +28,7 @@

            Directory or file path from which data will be extracted.

            Directory from which data is to be migrated. All files (including all nested subdirectories and their subfiles) in the directory will be migrated.

            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            /user/cdm/

            @@ -91,7 +91,7 @@

            Use First Row as Header

            This parameter is displayed only when File Format is set to CSV. When you migrate a CSV file to a table, CDM writes all data to the table by default. If you set this parameter to Yes, CDM uses the first N rows of the CSV file as the heading row and does not write the row to the destination table.

            +

            This parameter is displayed only when File Format is set to CSV. When you migrate a CSV file to a table, CDM writes all data to the table by default. If you set this parameter to Yes, CDM uses the first N rows of the CSV file as the heading row and does not write the row to the destination table.

            No

            Directory Filter

            If you set Filter Type to Wildcard or Regex, enter a wildcard character to filter paths. The paths that meet the filtering condition are migrated. You can configure multiple paths separated by commas (,).

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            *input

            @@ -129,7 +129,7 @@

            File Filter

            If you set Filter Type to Wildcard or Regex, you can enter a wildcard character to search for files in a specified path. The files that meet the search criteria are migrated. You can configure multiple files separated by commas (,).

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            *.csv

            @@ -146,7 +146,7 @@

            If you set Filter Type to Time Filter, and specify a point in time for this parameter, only the files modified at or after the specified time are transferred. The time format must be yyyy-MM-dd HH:mm:ss.

            This parameter can be set to a macro variable of date and time. For example, ${timestamp(dateformat(yyyy-MM-dd HH:mm:ss,-90,DAY))} indicates that only files generated within the latest 90 days are migrated.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-07-01 00:00:00

            @@ -156,7 +156,7 @@

            If you set Filter Type to Time Filter, and specify a point in time for this parameter, only the files modified before the specified time are transferred. The time format must be yyyy-MM-dd HH:mm:ss.

            This parameter can be set to a macro variable of date and time. For example, ${timestamp(dateformat(yyyy-MM-dd HH:mm:ss))} indicates that only the files whose modification time is earlier than the current time are migrated.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-07-30 00:00:00

            @@ -181,7 +181,7 @@

            DEK

            This parameter is displayed only when Encryption is set to AES-256-GCM. The key consists of 64 hexadecimal numbers and must be the same as the DEK configured during encryption. If the encryption and decryption keys are inconsistent, the system does not report an exception, but the decrypted data is incorrect.

            +

            This parameter is displayed only when Encryption is set to AES-256-GCM. The key consists of 64 hexadecimal numbers and must be the same as the DEK configured during encryption. If the encryption and decryption keys are inconsistent, the system does not report an exception, but the decrypted data is incorrect.

            DD0AE00DFECD78BF051BCFDA25BD4E320DB0A7AC75A1F3FC3D3C56A457DCDC1B

            Name of the HBase table that data will be exported from

            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            TBL_2

            @@ -55,7 +55,7 @@

            (Optional) Start time (including the value) for extracting data. The format is yyyy-MM-dd HH:mm:ss. Only the data generated at the specified time and later is extracted.

            This parameter can be set to a macro variable of date and time. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-01-01 20:00:00

            @@ -65,7 +65,7 @@

            (Optional) End time (excluding the value) for extracting data. The format is yyyy-MM-dd HH:mm:ss. Only the data generated before the time point is extracted.

            This parameter can be set to a macro variable of date and time.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-02-01 20:00:00

            @@ -77,7 +77,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0051.html b/docs/dataartsstudio/umn/dataartsstudio_01_0051.html index 8d83be724..b1afc1a25 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0051.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0051.html @@ -26,7 +26,7 @@

            Hive table name. Click the icon next to the text box. The dialog box for selecting the table is displayed.

            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            TBL_E

            @@ -35,7 +35,9 @@

            Read Mode

            Two read modes are available: HDFS and JDBC. By default, the HDFS mode is used. If you do not need to use the WHERE condition to filter data or add new fields on the field mapping page, select the HDFS mode.

            -
            • The HDFS mode shows good performance, but in this mode, you cannot use the WHERE condition to filter data or add new fields on the field mapping page.
            • The HDFS mode allows you to use the WHERE condition to filter data or add new fields on the field mapping page.
            +
            • The HDFS mode shows good performance, but in this mode, you cannot use the WHERE condition to filter data or add new fields on the field mapping page.
            • The HDFS mode allows you to use the WHERE condition to filter data or add new fields on the field mapping page.
              NOTE:

              If the migration source is Hive and JDBC is used to read data, CDM does not support concurrency. That is, Concurrent Extractors can only be set to 1.

              +
              +

            HDFS

            SQL Statement

            When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

            -
            NOTE:
            • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
            • With statements are not supported.
            • Comments, such as -- and /*, are not supported.
            • Addition, deletion, and modification operations are not supported, including but not limited to the following:
              • load data
              • delete from
              • alter table
              • create table
              • drop table
              • into outfile
              -
            +
            NOTE:
            • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
            • With statements are not supported.
            • Comments, such as -- and /*, are not supported.
            • Addition, deletion, and modification operations are not supported, including but not limited to the following:
              • load data
              • delete from
              • alter table
              • create table
              • drop table
              • into outfile
              +
            • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

            select id,name from sqoop.user;

            @@ -64,7 +66,7 @@

            This parameter is displayed when you select the HDFS read mode and click Show Advanced Attributes.

            This parameter indicates extracting the partition of a specified value. The attribute name is the partition name. You can configure multiple values (separated by spaces) or a field value range. The time macro function is supported.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            • Attribute value in the single-value or multi-value filtering scenario:

              ${dateformat(yyyyMMdd, -1, DAY)} ${dateformat(yyyyMMdd)}

              @@ -77,7 +79,7 @@

            This parameter is displayed when you select the JDBC read mode and click Show Advanced Attributes.

            This parameter indicates the WHERE clause to be extracted. If this parameter is not set, the entire table is extracted. If the table to be migrated does not contain the fields specified by the WHERE clause, the migration will fail.

            You can set a date macro variable to extract data generated on a specific date.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            age > 18 and age <= 60

            @@ -91,7 +93,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0052.html b/docs/dataartsstudio/umn/dataartsstudio_01_0052.html index fa80328bb..13c406489 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0052.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0052.html @@ -21,7 +21,7 @@

            Directory or file path from which data will be extracted. You can enter a maximum of 50 file paths. By default, the file paths are separated by vertical bars (|). You can also customize a file separator.

            Directory from which data is to be migrated. All files (including all nested subdirectories and their subfiles) in the directory will be migrated.

            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            /ftp/a.csv|/ftp/b.txt

            @@ -39,7 +39,7 @@

            JSON Type

            This parameter is displayed only when File Format is set to JSON. Type of a JSON object stored in a JSON file. The options are JSON object and JSON array.

            +

            This parameter is displayed only when File Format is set to JSON. Type of a JSON object stored in a JSON file. The options are JSON object and JSON array.

            JSON object

            Use First Row as Header

            This parameter is displayed only when File Format is set to CSV. When you migrate a CSV file to a table, CDM writes all data to the table by default. If you set this parameter to Yes, CDM uses the first N rows of the CSV file as the heading row and does not write the row to the destination table.

            +

            This parameter is displayed only when File Format is set to CSV. When you migrate a CSV file to a table, CDM writes all data to the table by default. If you set this parameter to Yes, CDM uses the first N rows of the CSV file as the heading row and does not write the row to the destination table.

            Yes

            Directory Filter

            If you set Filter Type to Wildcard or Regex, enter a wildcard character to filter paths. The paths that meet the filtering condition are migrated. You can configure multiple paths separated by commas (,).

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            *input,*out

            @@ -182,7 +182,7 @@

            File Filter

            If you set Filter Type to Wildcard or Regex, enter a wildcard character to filter paths. The files that meet the filtering condition are migrated. You can configure multiple files separated by commas (,).

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            *.csv

            @@ -199,7 +199,7 @@

            If you set Time Filter to Yes, you can specify a point in time for Minimum Timestamp, and then only the files modified at or after the specified time are transferred. The time format must be yyyy-MM-dd HH:mm:ss.

            This parameter can be set to a macro variable of date and time. For example, ${timestamp(dateformat(yyyy-MM-dd HH:mm:ss,-90,DAY))} indicates that only files generated within the latest 90 days are migrated.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-07-01 00:00:00

            @@ -209,7 +209,7 @@

            If you set Time Filter to Yes, you can specify a point in time for Maximum Timestamp, and then only the files modified before the specified time are transferred. The time format must be yyyy-MM-dd HH:mm:ss.

            This parameter can be set to a macro variable of date and time. For example, ${timestamp(dateformat(yyyy-MM-dd HH:mm:ss))} indicates that only the files whose modification time is earlier than the current time are migrated.

            -
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            +
            NOTE:

            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

            2019-07-30 00:00:00

            @@ -260,7 +260,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0053.html b/docs/dataartsstudio/umn/dataartsstudio_01_0053.html index 52a255369..ebf84728b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0053.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0053.html @@ -49,9 +49,9 @@

            File Format

            Format used for transmitting data. The CSV and JSON formats are supported for migration to tables, and the binary format is supported for file migration.

            +

            Format used for transmitting data. The CSV and JSON formats are supported for migration to tables, and the binary format is supported for file migration.

            Binary

            +

            Binary

            Compression Format

            @@ -98,13 +98,20 @@

            .md5

            Query Parameter

            +

            If this parameter is set to Yes, the name of the object to be uploaded is a string with the query parameter removed.

            +

            No

            +
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0054.html b/docs/dataartsstudio/umn/dataartsstudio_01_0054.html index ea19b54de..6b25b5799 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0054.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0054.html @@ -25,8 +25,8 @@

      SQL Statement

      When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

      -
      NOTE:
      • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
      • With statements are not supported.
      • Comments, such as -- and /*, are not supported.
      • Addition, deletion, and modification operations are not supported, including but not limited to the following:
        • load data
        • delete from
        • alter table
        • create table
        • drop table
        • into outfile
        -
      +
      NOTE:
      • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
      • With statements are not supported.
      • Comments, such as -- and /*, are not supported.
      • Addition, deletion, and modification operations are not supported, including but not limited to the following:
        • load data
        • delete from
        • alter table
        • create table
        • drop table
        • into outfile
        +
      • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

      select id,name from sqoop.user;

      @@ -48,7 +48,7 @@

      Name of the table from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting the table or directly enter a table name.

      If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      NOTE:
      The table name can contain wildcard characters (*), which is used to export all tables whose names start with a certain prefix or end with a certain suffix. The number and types of fields in the tables must be the same. The examples are as follows:
      • table* indicates that all tables whose names starting with table are exported.
      • *table indicates that all tables whose names ending with table are exported.
      • *table* indicates that all tables whose names containing table are exported.
      @@ -75,7 +75,7 @@

      WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

      You can set a date macro variable to extract data generated on a specific date.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

      @@ -139,7 +139,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0055.html b/docs/dataartsstudio/umn/dataartsstudio_01_0055.html index 26eaa6d01..001499282 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0055.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0055.html @@ -48,7 +48,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0056.html b/docs/dataartsstudio/umn/dataartsstudio_01_0056.html index 130fd54dd..b9154239c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0056.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0056.html @@ -61,7 +61,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0058.html b/docs/dataartsstudio/umn/dataartsstudio_01_0058.html index e89f2090e..b76adab32 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0058.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0058.html @@ -145,7 +145,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0059.html b/docs/dataartsstudio/umn/dataartsstudio_01_0059.html index ba52e8a8c..1a76f5bbe 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0059.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0059.html @@ -1,7 +1,7 @@

      From Elasticsearch or CSS

      -

      If the source link of a job is a link described in Link to Elasticsearch or Link to CSS, configure the source job parameters based on Table 1.

      +

      If the source link of a job is a link described in Elasticsearch Link Parameters or CSS Link Parameters, configure the source job parameters based on Table 1.

      @@ -14,7 +14,6 @@ @@ -81,7 +80,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0060.html b/docs/dataartsstudio/umn/dataartsstudio_01_0060.html index a3943489f..2079df817 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0060.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0060.html @@ -52,7 +52,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0061.html b/docs/dataartsstudio/umn/dataartsstudio_01_0061.html index 1a80f867f..e1d11fab2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0061.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0061.html @@ -1,6 +1,6 @@ -

      Destination Job Parameters

      +

      Configuring CDM Destination Job Parameters

      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0062.html b/docs/dataartsstudio/umn/dataartsstudio_01_0062.html index 7b1b44dc5..5a7538eea 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0062.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0062.html @@ -27,7 +27,7 @@ - + + + + - - + + + + + + + + + + + + + + + + + + + + - + + + + + + + +
      Table 1 Job parameters when Elasticsearch or CSS is the source

      Category

      Basic parameters

      -

      Index

      OBS directory to which data will be written. Do not add / in front of the directory name.

      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      directory/

      @@ -65,7 +65,7 @@

      KMS ID

      Data encryption key. This parameter is displayed when Encryption is set to KMS. Click next to the text box to select the KMS key that was created in DEW.

      +

      Data encryption key. This parameter is displayed when Encryption is set to KMS. Click next to the text box to select the KMS key that was created in DEW.

      • If the KMS key of the same project as that of the CDM cluster is used, you do not need to modify Project ID.
      • If the KMS key of another project is used, you need to modify Project ID.

      53440ccb-3e73-4700-98b5-71ff5476e621

      @@ -221,7 +221,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0063.html b/docs/dataartsstudio/umn/dataartsstudio_01_0063.html index 3fa01f59c..6fcec5a19 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0063.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0063.html @@ -15,7 +15,7 @@

      HDFS directory to which data will be written.

      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      /user/output

      @@ -139,7 +139,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0064.html b/docs/dataartsstudio/umn/dataartsstudio_01_0064.html index 9302a2c7d..d8d97e856 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0064.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0064.html @@ -15,7 +15,7 @@

      Name of the HBase table to which data will be written. If you want to create an HBase table, you can copy the field names from the migration source. Click the icon next to the text box. The dialog box for selecting the table is displayed.

      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      TBL_2

      @@ -83,7 +83,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0066.html b/docs/dataartsstudio/umn/dataartsstudio_01_0066.html index d9a8f0dda..04ca989c3 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0066.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0066.html @@ -22,7 +22,7 @@

      Destination table name. Click the icon next to the text box. The dialog box for selecting the table is displayed.

      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      TBL_X

      @@ -38,6 +38,14 @@

      Non-auto creation

      Source side null value conversion value

      +

      Value to which the source null value is converted

      +
      • TO_NULL
      • TO_EMPTY_STRRING
      • TO_NULL_STRING
      +

      TO_NULL

      +

      Clear Data Before Import

      Whether the data in the destination table is cleared before data import. The options are as follows:
      • Yes: The data is cleared.
      • No: The data is not cleared. Instead, it will be added to the existing table.
      @@ -46,29 +54,95 @@

      Yes

      Partition to Clear

      +

      Processing mode of newline characters

      This parameter is available when Clear Data Before Import is set to Yes.

      -

      When you enter the information about the partitions to be cleared, the data in the partitions will be cleared.

      +

      Policy for processing the newline characters in the data written to Hive textfile tables

      +
      • Delete
      • Replace with another string
      • Ignore
      +

      Delete

      +

      Hive Table Partition Field

      +

      This parameter is unavailable when Auto Table Creation is set to Non-auto Creation.

      +

      Partition fields for creating a Hive table. Use commas (,) to separate multiple fields.

      +

      A,B

      +

      Table Path

      +

      This parameter is unavailable when Auto Table Creation is set to Non-auto Creation.

      +

      It specifies the table path.

      +

      -

      +

      Storage Format

      +

      This parameter is unavailable when Auto Table Creation is set to Non-auto Creation.

      +

      It specifies the storage format.

      +
      • Row-based storage format: TEXTFILE
      • Column-based storage formats: ORC, RCFILE, and PARQUET
      +

      TEXTFILE data is stored in plaintext. If data contains special characters, data may be written incorrectly. Exercise caution when using this format. The ORC format is recommended.

      +

      ORC

      +

      ClearDataMode

      +

      This parameter is available when Clear Data Before Import is set to Yes.

      +

      It specifies the mode for clearing data in the Hive table.

      +
      • LOAD_OVERWRITE: A temporary data file directory is generated and loaded to the Hive table using the load overwrite syntax of Hive.
      • TRUNCATE: Data files in partitions are deleted, but partitions are not deleted.
        NOTE:

        If the destination is a partitioned table, you are advised to select LOAD_OVERWRITE. Otherwise, the cluster memory or disks may be overloaded.

        +
        +
      +

      TRUCATE

      +

      Partitions info

      +

      This parameter is available when Clear Data Before Import is set to Yes. If the destination is a partitioned table, you must specify partitions.

      +
      • If you select the TRUCATE mode, only the data files in the partitions are deleted.
      • If you select the LOAD_OVERWRITE mode, data is written to a specified partition and overwrites the existing data.

        +

      Single partition: year=2020,location=sun

      Multiple partitions: ['year=2020,location=sun', 'year=2021,location=earth']

      +

      Partitions of the previous day:

      +

      day='${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}',

      Executing Analyze Statements

      After all data is written, the ANALYZE TABLE statement is asynchronously executed to accelerate the Hive table query. The SQL statement is as follows:

      +

      After all data is written, the ANALYZE TABLE statement is asynchronously executed to accelerate query of data from Hive tables.

      +

      Run the following SQL statements:

      • Non-partitioned table: ANALYZE TABLE tablename COMPUTE STATISTICS
      • Partitioned table: ANALYZE TABLE tablename PARTITION(partcol1[=val1], partcol2[=val2], ...) COMPUTE STATISTICS
      NOTE:

      Parameter Executing Analyze Statements applies only to the migration of a single table.

      +

      Running the ANALYZE statements may exert pressure on Hive.

      Yes

      Maximum memory size of the internal write queue

      +

      If the memory is insufficient, change the value of this parameter as needed. If the value is too small, the migration speed will be affected.

      +

      The value ranges from 1 to 128 MB. The default value is empty, indicating that there is no limit. If you set a value beyond the range, there is no limit.

      +

      16

      +

      Maximum memory size of the internal conversion queue

      +

      If the memory is insufficient, change the value of this parameter as needed. If the value is too small, the migration speed will be affected.

      +

      The value ranges from 1 to 128 MB. The default value is empty, indicating that there is no limit. If you set a value beyond the range, there is no limit.

      +

      16

      +
      -
      • When Hive serves as the destination end, a table whose storage format is ORC is automatically created.
      • Due to file format restrictions, complex data can be written only in ORC or Parquet format.
      • If the source Hive contains both the array and map types of data, the destination table format can only be the ORC or parquet complex type. If the destination table format is RC or TEXT, the source data will be processed and can be successfully written.
      • As the map type is an unordered data structure, the data type may change after a migration.
      • If Hive serves as the migration destination and the storage format is Textfile, delimiters must be explicitly specified in the statement for creating Hive tables. The following is an example:
        CREATE TABLE csv_tbl(
        +
        • If the source Hive contains both the array and map types of data, the destination table format can only be the ORC or parquet complex type. If the destination table format is RC or TEXT, the source data will be processed and can be successfully written.
        • As the map type is an unordered data structure, the data type may change after a migration.
        • If Hive serves as the migration destination and the storage format is Textfile, delimiters must be explicitly specified in the statement for creating Hive tables. The following is an example:
          CREATE TABLE csv_tbl(
           smallint_value smallint,
           tinyint_value tinyint,
           int_value int,
          @@ -100,7 +174,7 @@ STORED AS TEXTFILE;
        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0068.html b/docs/dataartsstudio/umn/dataartsstudio_01_0068.html index c28de4e26..53b92d919 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0068.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0068.html @@ -35,7 +35,7 @@

      Name of the table to which data will be written. Click the icon next to the text box. The dialog box for selecting the table is displayed.

      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

      -
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      +
      NOTE:

      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

      table

      @@ -121,7 +121,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0069.html b/docs/dataartsstudio/umn/dataartsstudio_01_0069.html index 57d7ee7b6..f75b8af79 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0069.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0069.html @@ -1,7 +1,7 @@

      To DDS

      -
      If the destination link of a job is a DDS link, configure the destination job parameters based on Table 1. +
      If the destination link of a job is a DDS link, configure the destination job parameters based on Table 1.
      - @@ -32,7 +32,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0070.html b/docs/dataartsstudio/umn/dataartsstudio_01_0070.html index c88bf0fdc..2ee0c0c13 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0070.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0070.html @@ -27,7 +27,7 @@ - @@ -68,7 +68,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0071.html b/docs/dataartsstudio/umn/dataartsstudio_01_0071.html index 3770ebbba..0cca9c83c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0071.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0071.html @@ -1,62 +1,75 @@

      To Elasticsearch/CSS

      -

      If the destination link of a job is a link described in Link to Elasticsearch or Link to CSS, configure the destination job parameters based on Table 1.

      +

      If the destination link of a job is a link described in Elasticsearch Link Parameters or CSS Link Parameters, configure the destination job parameters based on Table 1.

      +

      The parameters required for table/file migration are different from those for entire DB migration. The following table lists the parameters for table/file migration. The actual parameters are subject to those displayed on the console.

      +
      -
      Table 1 Parameter description

      Parameter

      Description

      @@ -12,7 +12,7 @@

      Database Name

      Database to which data is to be imported.

      +

      Database to which data is to be imported

      ddsdb

      Use Column Value as Field

      This parameter is displayed when Value Storage Type is set to Hash. Only Hash is supported. If this function is enabled, values are alternately used as fields and values in sequence except the primary key column.

      +

      This parameter is displayed when Value Storage Type is set to HASH. Only Hash is supported. If this function is enabled, values are alternately used as fields and values in sequence except the primary key column.

      Yes

      - - - - - - - @@ -178,7 +182,8 @@
      Table 1 Job parameters when Elasticsearch/CSS is the destination

      Parameter

      +
      - - - - - - - - - - - - - + + + + - - - - - - - @@ -65,7 +78,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0072.html b/docs/dataartsstudio/umn/dataartsstudio_01_0072.html index 1ac9f9595..cf47828bc 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0072.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0072.html @@ -2,7 +2,7 @@

      To DLI

      If the destination link of a job is a DLI link, configure the destination job parameters based on Table 1.

      -

      When you use CDM to migrate data to DLI, DLI generates data files in the dli-trans* temporary OBS bucket. Therefore, you need to grant the account corresponding to the AK/SK the permissions to read and write the dli-trans* bucket and create directories. For details about how to add OBS permission policies, see Adding an OBS Bucket Policy.

      +

      When data is migrated to DLI using CDM, DLI generates data files in the dli-trans* temporary OBS bucket. Therefore, you need to grant the user who uses the AK/SK the permissions to read and write the dli-trans* bucket and create directories. Otherwise, the migration will fail. For details about how to add permission policies for temporary bucket dli-trans*, see Adding an Authorization Policy for the dli-trans* Temporary Bucket.

      Table 1 Job parameters when Elasticsearch/CSS is the destination

      Parameter

      Description

      +

      Description

      Example Value

      +

      Example Value

      Index

      +

      Index

      Elasticsearch index, which is similar to the name of a relational database. CDM supports automatic creation of indexes and field types. The index and field type names can contain only lowercase letters.

      +

      Elasticsearch index, which is similar to the name of a relational database. CDM supports automatic creation of indexes and field types. The index and field type names can contain only lowercase letters.

      index

      +

      index

      Type

      +

      Type

      Elasticsearch type, which is similar to the table name of a relational database. The type name can contain only lowercase letters.

      +

      Elasticsearch type, which is similar to the table name of a relational database. The type name can contain only lowercase letters.

      NOTE:

      Elasticsearch 7.x and later versions do not support custom types. Instead, only the _doc type can be used. In this case, this parameter does not take effect even if it is set.

      type

      +

      type

      Pipeline ID

      +

      Operation

      Pipeline used to convert the data format after data is transferred to Elasticsearch. Pipeline IDs are ready for use after being created in Kibana.

      +

      Operation type

      +
      • INDEX: No primary key is required. Elasticsearch generates IDs so that data is written to a new file with a unique ID for each write operation.
      • CREATE: A primary key needs to be specified. If the primary key already exists, the write operation fails.
      • UPDATE: A primary key needs to be specified. If the primary key already exists, the original data is overwritten.
      • UPSERT: A primary key needs to be specified. If a primary key already exists, the existing data is overwritten. If there is no primary key, a new document is created for writing data.

      pipeline_id

      +

      INDEX

      Write ES with Routing

      +

      Pipeline ID

      If you enable this function, a column can be written to Elasticsearch as a route.

      +

      ID of the pipeline used to convert the format of the data transferred to Elasticsearch.

      +

      If the destination is Elasticsearch, you need to create a pipeline ID in Kibana first.

      +

      If the destination is CSS, you do not need to create a pipeline ID. Instead, enter the name of the configuration file, which is name by default.

      +

      If the destination is Elasticsearch: pipeline_id

      +

      If the destination is CSS: name (name of the configuration file)

      +

      Write ES with Routing

      +

      If you enable this function, a column can be written to Elasticsearch as a route.

      NOTE:

      Before enabling this function, create indexes at the destination to improve the query efficiency.

      No

      +

      No

      Route Column

      +

      Route Column

      This parameter is available when Write ES with Routing is set to Yes. It specifies the destination routing column. If the destination index exists but the column information cannot be obtained, you can manually enter the column. The route column can be empty. If it is empty, no routing value is specified for the data written to Elasticsearch.

      +

      This parameter is available when Write ES with Routing is set to Yes. It specifies the destination routing column. If the destination index exists but the column information cannot be obtained, you can manually enter the column. The route column can be empty. If it is empty, no routing value is specified for the data written to Elasticsearch.

      value1

      +

      value1

      Periodically Create Index

      +

      Periodically Create Index

      For streaming jobs that continuously write data to Elasticsearch, CDM periodically creates indexes and writes data to the indexes, which helps you delete expired data. The indexes can be created based on the following periods:
      • Every hour: CDM creates indexes on the hour. The new indexes are named in the format of Index name+Year+Month+Day+Hour, for example, index2018121709.
      • Every day: CDM creates indexes at 00:00 every day. The new indexes are named in the format of Index name+Year+Month+Day, for example, index20181217.
      • Every week: CDM creates indexes at 00:00 every Monday. The new indexes are named in the format of Index name+Year+Week, for example, index201842.
      • Every month: CDM creates indexes at 00:00 on the first day of each month. The new indexes are named in the format of Index name+Year+Month, for example, index201812.
      • Do not create: Do not create indexes periodically.
      +
      For streaming jobs that continuously write data to Elasticsearch, CDM periodically creates indexes and writes data to the indexes, which helps you delete expired data. The indexes can be created based on the following periods:
      • Every hour: CDM creates indexes on the hour. The new indexes are named in the format of Index name+Year+Month+Day+Hour, for example, index2018121709.
      • Every day: CDM creates indexes at 00:00 every day. The new indexes are named in the format of Index name+Year+Month+Day, for example, index20181217.
      • Every week: CDM creates indexes at 00:00 every Monday. The new indexes are named in the format of Index name+Year+Week, for example, index201842.
      • Every month: CDM creates indexes at 00:00 on the first day of each month. The new indexes are named in the format of Index name+Year+Month, for example, index201812.
      • Do not create: Do not create indexes periodically.

      When extracting data from a file, you must configure a single extractor, which means setting Concurrent Extractors to 1. Otherwise, this parameter is invalid.

      Every hour

      +

      Every hour

      Table 1 Parameter description

      Parameter

      @@ -72,16 +72,94 @@
      -

      Adding an OBS Bucket Policy

      1. Log in to the IAM console.
      2. In the navigation pane, choose Permissions > Policies/Roles and click Create Custom Policy in the upper right corner.

        Figure 1 Creating a custom policy
        -

      3. Enter a policy name and set Policy Content.

        Figure 2 Configuring the policy
        -

        -

      4. Enter the policy description and click OK.
      +

      Adding an Authorization Policy for the dli-trans* Temporary Bucket

      1. Log in to the IAM console.
      2. In the navigation pane, choose Permissions > Policies/Roles and click Create Custom Policy in the upper right corner.

        Figure 1 Creating a custom policy
        +

      3. On the Create Custom Policy page, select JSON for Policy View and create custom policy obs_dli-trans.

        {
        +    "Version": "1.1",
        +    "Statement": [
        +        {
        +            "Effect": "Allow",
        +            "Action": [
        +                "obs:object:GetObject",
        +                "obs:object:DeleteObjectVersion",
        +                "obs:bucket:GetBucketLocation",
        +                "obs:object:GetAccessLabel",
        +                "obs:bucket:PutEncryptionConfiguration",
        +                "obs:bucket:PutBucketStoragePolicy",
        +                "obs:object:DeleteAccessLabel",
        +                "obs:bucket:PutBucketCustomDomainConfiguration",
        +                "obs:bucket:GetLifecycleConfiguration",
        +                "obs:bucket:PutBucketInventoryConfiguration",
        +                "obs:bucket:DeleteDirectColdAccessConfiguration",
        +                "obs:object:AbortMultipartUpload",
        +                "obs:bucket:PutBucketLogging",
        +                "obs:bucket:DeleteBucketWebsite",
        +                "obs:object:DeleteObject",
        +                "obs:bucket:PutBucketVersioning",
        +                "obs:bucket:GetBucketWebsite",
        +                "obs:bucket:GetBucketLogging",
        +                "obs:bucket:DeleteBucketCustomDomainConfiguration",
        +                "obs:object:PutObject",
        +                "obs:object:RestoreObject",
        +                "obs:bucket:PutReplicationConfiguration",
        +                "obs:bucket:GetBucketQuota",
        +                "obs:object:GetObjectVersionAcl",
        +                "obs:bucket:DeleteBucket",
        +                "obs:bucket:CreateBucket",
        +                "obs:bucket:GetDirectColdAccessConfiguration",
        +                "obs:bucket:PutDirectColdAccessConfiguration",
        +                "obs:bucket:GetBucketAcl",
        +                "obs:bucket:GetBucketVersioning",
        +                "obs:bucket:GetBucketInventoryConfiguration",
        +                "obs:bucket:GetBucketStoragePolicy",
        +                "obs:bucket:GetEncryptionConfiguration",
        +                "obs:bucket:PutBucketCORS",
        +                "obs:bucket:PutBucketTagging",
        +                "obs:bucket:GetBucketTagging",
        +                "obs:bucket:PutLifecycleConfiguration",
        +                "obs:bucket:GetBucketCustomDomainConfiguration",
        +                "obs:object:ListMultipartUploadParts",
        +                "obs:object:ModifyObjectMetaData",
        +                "obs:bucket:ListBucketVersions",
        +                "obs:bucket:PutBucketQuota",
        +                "obs:object:PutAccessLabel",
        +                "obs:bucket:ListBucket",
        +                "obs:bucket:GetBucketCORS",
        +                "obs:bucket:DeleteBucketInventoryConfiguration",
        +                "obs:object:GetObjectVersion",
        +                "obs:bucket:PutBucketWebsite",
        +                "obs:bucket:DeleteReplicationConfiguration",
        +                "obs:object:GetObjectAcl",
        +                "obs:bucket:GetBucketNotification",
        +                "obs:bucket:PutBucketNotification",
        +                "obs:bucket:GetReplicationConfiguration",
        +                "obs:bucket:GetBucketPolicy",
        +                "obs:bucket:DeleteBucketTagging",
        +                "obs:bucket:GetBucketStorage"
        +            ],
        +            "Resource": [
        +                "OBS:*:*:object:*",
        +                "OBS:*:*:bucket:dli-trans*"
        +            ]
        +        }
        +    ]
        +}
        +
        Figure 2 Creating custom policy obs_dli-trans
        +

        +

      4. Click OK.
      5. In the navigation pane, choose User Groups, locate the user group to which the DLI link user using the AK/SK belongs, and click Authorize to assign the custom obs_dli-trans policy to the user.

        Figure 3 Assigning the custom obs_dli-trans policy to a user group
        +

        +

      -

      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0074.html b/docs/dataartsstudio/umn/dataartsstudio_01_0074.html index c50ba84dd..e998cfd21 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0074.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0074.html @@ -38,7 +38,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0075.html b/docs/dataartsstudio/umn/dataartsstudio_01_0075.html index 928dd9397..c676ceb80 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0075.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0075.html @@ -8,7 +8,7 @@

      Constraints

      Field names of the source and destination parameters cannot contain ampersands (&) or number signs (%).

      -

      Prerequisites

      +

      Prerequisites

      • The CDM cluster can communicate with the data source.

      Procedure

      1. Log in to the management console and choose Service List > Cloud Data Migration. In the left navigation pane, choose Cluster Management. Locate the target cluster and click Job Management.
      2. Choose Entire DB Migration > Create Job. The page for configuring the job is displayed.
      3. Configure the related parameters of the source database according to Table 1.

        @@ -62,25 +62,28 @@

      Start Time

      Start time (included). The format is yyyy-MM-dd hh:mm:ss. The dateformat time macro variable function is supported. Examples: 2017-12-31 20:00:00, ${dateformat(yyyy-MM-dd, -1, DAY)} 02:00:00, and ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}

      +

      Start time (included). The format is yyyy-MM-dd hh:mm:ss. The dateformat time macro variable function is supported.

      +

      Examples: 2017-12-31 20:00:00, ${dateformat(yyyy-MM-dd, -1, DAY)} 02:00:00, and ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}

      -

      +

      "2017-12-31 20:00:00"

      End Time

      End time (excluded) The format is yyyy-MM-dd hh:mm:ss. The dateformat time macro variable function is supported. Examples: 2018-01-01 20:00:00, ${dateformat(yyyy-MM-dd, -1, DAY)} 02:00:00, and ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}

      +

      End time (excluded) The format is yyyy-MM-dd hh:mm:ss. The dateformat time macro variable function is supported.

      +

      Examples: 2018-01-01 20:00:00, ${dateformat(yyyy-MM-dd, -1, DAY)} 02:00:00, and ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}

      -

      +

      "2018-01-01 20:00:00"

      Redis

      Key Filter Character

      Filter character used to determine the keys to be migrated For example, if the value of this parameter is a*, all asterisks (*) will be migrated.

      +

      Filter character used to determine the keys to be migrated

      +

      For example, if the value of this parameter is a*, all asterisks (*) will be migrated.

      -

      +

      a*

      DDS

      @@ -94,7 +97,8 @@

      Query Filter

      Filter used to match documents. Example: {HTTPStatusCode:{$gt:"400",$lt:"500"},HTTPMethod:"GET"}

      +

      Filter used to match documents.

      +

      Example: {HTTPStatusCode:{$gt:"400",$lt:"500"},HTTPMethod:"GET"}

      -

      -

    • If a relational database is migrated, after job parameters are configured, click Next to access the page for selecting tables. You can select the tables to be migrated to the migration destination based on your requirements.
    • Click Next and set job parameters.

      Figure 1 Task parameters
      +

    • If you are migrating an entire relational database, click Next after configuring job parameters to select source and destination tables. Ensure that the destination table names are the same as the source table names. For example, if the source table name is test, the destination table name must also be test.

      Figure 1 Field mapping
      +

    • Click Next and set job parameters.

      Figure 2 Task parameters
      Table 3 describes related parameters.
      @@ -197,7 +202,9 @@ - @@ -254,7 +261,14 @@
      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0076.html b/docs/dataartsstudio/umn/dataartsstudio_01_0076.html index 72c26d6ad..8ae346973 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0076.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0076.html @@ -48,9 +48,9 @@
      Table 3 Task configuration parameters

      Parameter

      Concurrent Extractors

      Number of extractors to be concurrently executed. Generally, retain the default value.

      +

      Maximum number of threads of the job for reading data from the source

      +
      NOTE:

      The number of concurrent threads may be less than or equal to the value of this parameter for some data sources that do not support concurrent extraction, for example, CSS and ClickHouse.

      +

      1

      -
      Figure 1 Setting Maximum Concurrent Extractors for a CDM cluster
      +
      Figure 1 Setting Maximum Concurrent Extractors for a CDM cluster
    • Configure the number of concurrent extractors based on the following rules:
      1. When data is to be migrated to files, CDM does not support multiple concurrent tasks. In this case, set a single process to extract data.
      2. If each row of the table contains less than or equal to 1 MB data, data can be extracted concurrently. If each row contains more than 1 MB data, it is recommended that data be extracted in a single thread.
      3. Set Concurrent Extractors for a job based on Maximum Concurrent Extractors for the cluster. It is recommended that Concurrent Extractors is less than Maximum Concurrent Extractors.
      4. If the destination is DLI, you are advised to set the number of concurrent extractors to 1. Otherwise, data may fail to be written.
      -
      Figure 2 Setting Concurrent Extractors for a job
      +
      Figure 2 Setting Concurrent Extractors for a job
    • @@ -60,3 +60,10 @@
      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0081.html b/docs/dataartsstudio/umn/dataartsstudio_01_0081.html index 374cf4af5..4b5c4adbb 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0081.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0081.html @@ -1,6 +1,6 @@ -

      Managing Jobs

      +

      Creating a Job in a CDM Cluster

      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0082.html b/docs/dataartsstudio/umn/dataartsstudio_01_0082.html index 69abedd9f..13e3efdaa 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0082.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0082.html @@ -1,6 +1,6 @@ -

      Scheduling Job Execution

      +

      Configuring a Scheduled CDM Job

      CDM supports scheduled execution of table/file migration jobs by minute, hour, day, week, and month. This section describes how to configure scheduled job parameters.

      • When configuring scheduled jobs, do not set the same scheduled time for different jobs. Instead, set different times to avoid exceptions.
      • If you use DataArts Studio DataArts Factory to schedule the CDM migration job and configure this parameter, both configurations take effect. To ensure unified service logic and avoid scheduling conflicts, enable job scheduling in DataArts Factory and do not configure a scheduled task for the job in DataArts Migration.

      • The scheduled execution function uses the Java Quartz timer, which is similar to the Cron expression configuration. It parses the minute, hour, day, and month of the start time, and constructs a cronb expression.

        For example, in the daily scheduling mode where the interval is set to 1 day: if the current time is 2022-10-14 12:00 and the start time is set to 2022-10-14 00:00, the job is executed at 2022-10-15 00:00; if the current time is 2022-10-14 12:00 and the start time is set to 2022-10-14 00:00, the job is executed at 2022-10-15 00:00.

        @@ -9,45 +9,51 @@

      Scheduling Job Execution by Minute

      CDM allows jobs to be executed every several minutes. It is recommended that the cycle be at least 5 minutes.
      • Start Time: indicates the time when the scheduled configuration takes effect, or the first time when the job is automatically executed.
      • Cycle (minutes): indicates the interval when a job is executed starting from the start time.
      • End Time: This parameter is optional. If it is not set, the scheduled job keeps being automatically executed. If it is set, the scheduled job will be automatically stopped at the end time.
      -
      Figure 1 Scheduling job execution by minute
      +
      Figure 1 Scheduling job execution by minute

      -

      For example, the settings shown in Figure 1 mean that the job will be automatically executed at 00:00 on January 1, 2023 for the first time at a cycle of 30 minutes until 23:59 on December 31, 2023.

      +

      For example, the settings shown in the above figure mean that the job will be automatically executed at 00:00 on January 1, 2023 for the first time at a cycle of 30 minutes until 23:59 on December 31, 2023.

      Scheduling Job Execution by Hour

      CDM allows jobs to be executed every several hours.
      • Cycle (hours): indicates the interval when a job is automatically executed.
      • Trigger Time (minute): indicates the exact time in each hour when a scheduled task is triggered. The value ranges from 0 to 59. You can set a maximum of 60 values and use commas (,) to separate these values. However, the values must be unique.

        If the trigger time is not within the validity period, the system selects a trigger time closest to the validity period for the scheduled job to be automatically executed at the first time. The following gives an example:

        • Start Time: 1:20
        • Cycle (hours): 3
        • Trigger Time (minute): 10
      • Validity Period: includes Start Time and End Time.
        • Start Time: indicates the time when the scheduled configuration takes effect.
        • End Time: This parameter is optional, which indicates the time when the scheduled job is automatically stopped. If this parameter is not set, the scheduled job keeps being automatically executed.
      -
      Figure 2 Scheduling job execution by hour
      +
      Figure 2 Scheduling job execution by hour

      -

      For example, the settings shown in Figure 2 mean that the job will be automatically executed at 00:10 on January 1, 2023 for the first time, at 00:30 for the second time, and at 00:50 for the third time. It will be executed three times every two hours until 23:59 on December 31, 2023.

      +

      For example, the settings shown in the above figure mean that the job will be automatically executed at 00:10 on January 1, 2023 for the first time, at 00:30 for the second time, and at 00:50 for the third time. It will be executed three times every two hours until 23:59 on December 31, 2023.

      -

      Scheduling Job Execution by Day

      CDM allows jobs to be executed every several days.
      • Cycle (days): indicates the interval when a job is executed starting from the start time.
      • Validity Period: includes Start Time and End Time.
        • Start Time: indicates the time when the scheduled configuration takes effect, or the first time when the job is automatically executed.
        • End Time: This parameter is optional, which indicates the time when the scheduled job is automatically stopped. If this parameter is not set, the scheduled job keeps being automatically executed.
        +

        Scheduling Job Execution by Day

        CDM allows jobs to be executed every several days.
        • Cycle (days): indicates the interval when a job is executed starting from the start time.
        • Validity Period: includes Start Time and End Time.
          • Start Time: indicates the time when the scheduled configuration takes effect, or the first time when the job is automatically executed.
          • End Time: This parameter is optional, which indicates the time when the scheduled job is automatically stopped. If this parameter is not set, the scheduled job keeps being automatically executed.
        -
        Figure 3 Scheduling job execution by day
        +
        Figure 3 Scheduling job execution by day

        -

        For example, the settings shown in Figure 3 mean that the job will be automatically executed at 00:00 on January 1, 2023 for the first time, and will be executed once every three days. The configuration is valid permanently.

        -

        +

        For example, the settings shown in the above figure mean that the job will be automatically executed at 00:00 on January 1, 2023 for the first time, and will be executed once every three days. The configuration is valid permanently.

        Scheduling Job Execution by Week

        CDM allows jobs to be executed every several weeks.
        • Cycle (weeks): indicates the interval when a scheduled job is executed starting from the start time.
        • Trigger Time (day): You can specify the day of each week when the job is automatically executed. One or more days can be selected at a time.
        • Validity Period: includes Start Time and End Time.
          • Start Time: indicates the time when the scheduled configuration takes effect.
          • End Time: This parameter is optional, which indicates the time when the scheduled job is automatically stopped. If this parameter is not set, the scheduled job keeps being automatically executed.
        -
        Figure 4 Scheduling job execution by week
        +
        Figure 4 Scheduling job execution by week

        -

        For example, the settings shown in Figure 4 mean that the job will be automatically executed at 00:00 every Tuesday, Saturday, and Sunday every two weeks starting from 00:00 on January 1, 2023 until 23:59 on December 31, 2023.

        +

        For example, the settings shown in the above figure mean that the job will be automatically executed at 00:00 every Tuesday, Saturday, and Sunday every two weeks starting from 00:00 on January 1, 2023 until 23:59 on December 31, 2023.

        Scheduling Job Execution by Month

        CDM allows jobs to be executed every several months.
        • Cycle (months): indicates the interval when a scheduled job is executed starting from the start time.
        • Trigger Time (day): indicates the day of each month when the job is executed. The value ranges from 1 to 31. You can set multiple values and use commas (,) to separate these values. However, the values must be unique.
        • Validity Period: includes Start Time and End Time.
          • Start Time: indicates the time when the scheduled configuration takes effect. The automatic execution time is accurate to hour, minute, and second.
          • End Time: This parameter is optional, which indicates the time when the scheduled job is automatically stopped. If this parameter is not set, the scheduled job keeps being automatically executed.
        -
        Figure 5 Scheduling job execution by month
        +
        Figure 5 Scheduling job execution by month

        -

        For example, the settings shown in Figure 5 mean that the job will be automatically executed at 00:00 on the 5th and 25th days of each month starting from 00:00 on January 1, 2023 until 23:59 on December 31, 2023.

        +

        For example, the settings shown in the above figure mean that the job will be automatically executed at 00:00 on the 5th and 25th days of each month starting from 00:00 on January 1, 2023 until 23:59 on December 31, 2023.

      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0083.html b/docs/dataartsstudio/umn/dataartsstudio_01_0083.html index 4a1be4618..664f25faf 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0083.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0083.html @@ -1,52 +1,54 @@ -

      Job Configuration Management

      +

      Managing CDM Job Configuration

      On the Settings tab page, you can perform the following operations:

      Maximum Concurrent Extractors

      Maximum number of concurrent extraction tasks in a cluster

      +

      This parameter is also available on the Cluster Configuration page. You can change its value either on this page or the Cluster Configuration page.

      +
      CDM migrates data through data migration jobs. It works in the following way:
      1. When data migration jobs are submitted, CDM splits each job into multiple tasks based on the Concurrent Extractors parameter in the job configuration.

        Jobs for different data sources may be split based on different dimensions. Some jobs may not be split based on the Concurrent Extractors parameter.

      2. CDM submits the tasks to the running pool in sequence. Tasks (defined by Maximum Concurrent Extractors) run concurrently. Excess tasks are queued.
      -

      By setting an appropriate number of concurrent extractors for a job and the maximum number of concurrent extractors for the cluster, you can accelerate migration. You can configure the number of concurrent extractors as follows:

      +

      By setting appropriate values for the Concurrent Extractors and Maximum Concurrent Extractors parameters, you can accelerate migration.

      1. You are advised to set Maximum Concurrent Extractors to twice the number of vCPUs. For details, see Table 1. -
        Table 1 Recommended maximum number of concurrent extractors for a CDM cluster

        Flavor

        +
        - - - - - - - - - - -
        Table 1 Recommended maximum number of concurrent extractors for a CDM cluster

        Flavor

        vCPUs/Memory

        +

        vCPUs/Memory

        Recommended Maximum Concurrent Extractors

        +

        Recommended Maximum Concurrent Extractors

        cdm.large

        +

        cdm.large

        8 vCPUs, 16 GB

        +

        8 vCPUs, 16 GB

        16

        +

        16

        cdm.xlarge

        +

        cdm.xlarge

        16 vCPUs, 32 GB

        +

        16 vCPUs, 32 GB

        32

        +

        32

        cdm.4xlarge

        +

        cdm.4xlarge

        64 vCPUs, 128 GB

        +

        64 vCPUs, 128 GB

        128

        +

        128

        -
      2. Configure the number of concurrent extractors based on the following rules:
        1. When data is to be migrated to files, CDM does not support multiple concurrent tasks. In this case, set a single process to extract data.
        2. If each row of the table contains less than or equal to 1 MB data, data can be extracted concurrently. If each row contains more than 1 MB data, it is recommended that data be extracted in a single thread.
        3. Set Concurrent Extractors for a job based on Maximum Concurrent Extractors for the cluster. It is recommended that Concurrent Extractors is less than Maximum Concurrent Extractors.
        4. If the destination is DLI, you are advised to set the number of concurrent extractors to 1. Otherwise, data may fail to be written.
        +
      3. Configure the number of concurrent extractors based on the following rules:
        1. When data is to be migrated to files, CDM does not support multiple concurrent tasks. In this case, set a single process to extract data.
        2. If each row of the table contains less than or equal to 1 MB data, data can be extracted concurrently. If each row contains more than 1 MB data, it is recommended that data be extracted in a single thread.
        3. Set Concurrent Extractors for a job based on Maximum Concurrent Extractors for the cluster. It is recommended that the value of Concurrent Extractors is less than that of Maximum Concurrent Extractors.
        4. If the migration source is Hive and JDBC is used to read data, CDM does not support multi-concurrency. In this case, set the number of concurrent extractors to 1.
        5. If the destination is DLI, you are advised to set the number of concurrent extractors to 1. Otherwise, data may fail to be written.
      4. -

        Scheduled Backup/Restoration

        This function depends on the OBS service.

        -
        • Prerequisites

          An OBS link has been created. For details, see Link to OBS.

          +

          Scheduled Backup/Restoration

          This function depends on the OBS service. Backup files cannot be automatically aged. You need to manually delete backup files on a regular basis.

          +
          • Prerequisites

            An OBS link has been created. For details, see OBS Link Parameters.

          • Scheduled backup

            On the Job Management page, click Settings and configure Scheduled Backup and its related parameters.

            Table 2 Scheduled backup parameters

            Parameter

            @@ -112,7 +114,7 @@
            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0084.html b/docs/dataartsstudio/umn/dataartsstudio_01_0084.html index 2ebf6874a..bf0b4143d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0084.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0084.html @@ -1,30 +1,28 @@ -

            Managing a Single Job

            +

            Managing a CDM Job

            Existing CDM jobs can be viewed, modified, deleted, started, and stopped. This section describes how to view and modify a job.

            Viewing a Job

            • Viewing job status

              The job status can be New, Pending, Booting, Running, Failed, Succeeded, or Stopped.

              Pending indicates that the job is waiting to be scheduled by the system, and Booting indicates that the data to be migrated is being analyzed.

              -
            • Viewing the historical records

              On the Historical Record page, you can view job execution records, read/write statistics, and job execution logs.

              +
            • Viewing the historical records

              You can view job execution results and historical information in the last 30 days, including job execution records, read/write statistics, and job execution logs.

            • Viewing job logs

              On the Historical Record page, you can view all logs of a job.

              Alternatively, in the Operation column, choose More > Log to view the latest logs of the job.

            • Viewing the JSON file of a job

              You can directly edit the JSON file of a job, which is equivalent to modifying the parameter settings of the job.

            • Querying the job statistics

              You can open the preview window of a configured database job and view up to 1,000 pieces of data. By comparing the number of data records of the migration source and destination, you can check whether the migration was successful and whether data was lost.

            -

            Modifying a Job

            • Modifying the job parameters

              You can reconfigure job parameters, but you cannot reselect source and destination links.

              +

              Modifying a Job

              • Modifying the job parameters

                You can reconfigure job parameters and reselect source and destination links.

              • Editing the JSON file of a job

                You can directly edit the JSON file of a job, which is equivalent to modifying the parameter settings of the job.

              -

              Procedure

              1. Log in to the management console and choose Service List > Cloud Data Migration. In the left navigation pane, choose Cluster Management. Locate the target cluster and click Job Management.
              2. Click Historical Jobs to view all historical jobs executed in the latest month.

                CDM stores the jobs executed in the last month, including one-time jobs (jobs that are automatically deleted after execution) and jobs that are executed periodically. You can view and re-execute the jobs on the Historical Jobs tab page.

                -

                For a job that is executed periodically, a historical job is generated on the Historical Jobs tab page each time when the job is executed, regardless of whether the job is executed successfully. The names of historical jobs will be the same as the original job but with a random character string appended.

                -

              3. Click Table/File Migration. The job list is displayed. You can perform the following operations on a single job:

                • Modify the job parameters: Click Edit in the Operation column to modify the job parameters.
                • Run the job: Click Run in the Operation column to manually start the job.
                • View the historical records: Click Historical Record in the Operation column. On the Historical Record page that is displayed, view the job's historical execution records and read/write statistics. Click Log to view the job logs.
                • Delete the job: Choose More > Delete in the Operation column to delete the job.
                • Stop the job: Choose More > Stop in the Operation column to stop the job.
                • View the job JSON: Choose More > View Job JSON in the Operation column to view the job JSON.
                • Edit the job JSON: Choose More > Edit Job JSON in the Operation column to edit the job JSON files, which is similar to modify the job parameters.
                • Configure a scheduled job: Locate a job and choose More > Configure Scheduled Execution. You can set the cycle for periodically executing the job. For details, see Scheduling Job Execution.
                • View logs: Locate a job, click More in the Operation column, and select Log to view the latest log of the job.

                  You can also view all logs of the job on the Historical Record page.

                  +

                  Procedure

                  1. Log in to the management console and choose Service List > Cloud Data Migration. In the left navigation pane, choose Cluster Management. Locate the target cluster and click Job Management.
                  2. Click Table/File Migration. The job list is displayed. You can perform the following operations on a single job:

                    • Modify the job parameters: Click Edit in the Operation column to modify the job parameters.
                    • Run the job: Click Run in the Operation column to manually start the job.
                    • View the historical records: Click Historical Record in the Operation column. On the Historical Record page that is displayed, view the job's historical execution records and read/write statistics. Click Log to view the job logs.
                    • Delete the job: Choose More > Delete in the Operation column to delete the job.
                    • Stop the job: Choose More > Stop in the Operation column to stop the job.
                    • View the job JSON: Choose More > View Job JSON in the Operation column to view the job JSON.
                    • Edit the job JSON: Choose More > Edit Job JSON in the Operation column to edit the job JSON files, which is similar to modify the job parameters.
                    • Configure a scheduled job: Locate a job and choose More > Configure Scheduled Execution. You can set the cycle for periodically executing the job. For details, see Configuring a Scheduled CDM Job.
                    • View logs: Locate a job, click More in the Operation column, and select Log to view the latest log of the job.

                      You can also view all logs of the job on the Historical Record page.

                    • Retry the job: Locate a failed job, click More in the Operation column, and select Retry. The job will be automatically retried three times.

                  3. After the modification, click Save or Save and Run.
              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0085.html b/docs/dataartsstudio/umn/dataartsstudio_01_0085.html index eb6636f29..6502841cf 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0085.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0085.html @@ -1,17 +1,19 @@ -

              Managing Jobs in Batches

              -

              Scenario

              This section describes how to manage CDM table/file migration jobs in batches. The following operations are involved:
              • Manage jobs by group.
              • Run jobs in batches.
              • Delete jobs in batches.
              • Export jobs in batches.
              • Import jobs in batches.
              +

              Managing CDM Jobs

              +

              Scenario

              This section describes how to manage CDM table/file migration jobs in batches. The following operations are supported:
              • Managing jobs by group
              • Running jobs in batches
              • Deleting jobs in batches
              • Exporting jobs in batches
              • Importing jobs in batches
              You can export and import jobs in batches in the following scenarios:
              • Job migration between CDM clusters: You can migrate jobs from a cluster of an earlier version to a new version.
              • Job backup: You can stop or delete CDM clusters to reduce costs. In this case, you can export the job scripts in batches and save them, and create a cluster and import the job scripts if necessary.
              • Batch job creation: You can manually create a job and export the job configuration file in JSON format. Copy the content in the JSON file to the same file or new files, and then import the file/files to CDM to create jobs in batches.

              Procedure

              1. Log in to the management console and choose Service List > Cloud Data Migration. In the left navigation pane, choose Cluster Management. Locate the target cluster and click Job Management.
              2. Click Table/File Migration. The job list is displayed. You can perform the following batch operations:

                • Manage jobs by group.

                  CDM allows users to add, modify, search for, and delete job groups. When a group is deleted, all jobs in the group are deleted.

                  -

                  In the third step of creating a job, if jobs have been assigned to different groups, you can display, start, or export jobs by group.

                  +

                  When creating a job, if jobs have been assigned to different groups, you can display, start, or export jobs by group.

                  +

                  Starting jobs by group will run all jobs in the group. If user isolation is enabled, starting jobs by group will still run all jobs in the group even if otherIAM users in the a cloud platform account cannot view the jobs in the group. Therefore, you are not advised to start jobs by group in user isolation scenarios.

                  +
                • Run jobs in batches.

                  After selecting one or more jobs, click Run to start these jobs in batches.

                • Delete jobs in batches.

                  After selecting one or more jobs, click Delete to delete these jobs in batches.

                • Export jobs in batches.

                  Click Export.

                  -
                  Figure 1 Export
                  +
                  Figure 1 Export
                  • All jobs and links: Export all jobs and links at a time.
                  • All jobs: Export all jobs at a time.
                  • All links: Export all links at a time.
                  • Jobs by name: Select the jobs to export and click OK.
                  • All jobs by groups: Select the group to export and click OK.

                  Exported jobs are stored in JSON files, which can be used as backups or imported to other clusters.

                  For security purposes, no link password is exported when jobs are exported. All passwords are replaced by Add password here.

                  @@ -26,7 +28,7 @@
                  diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0086.html b/docs/dataartsstudio/umn/dataartsstudio_01_0086.html index 518d99c59..1fa88c00c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0086.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0086.html @@ -31,7 +31,7 @@
              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0088.html b/docs/dataartsstudio/umn/dataartsstudio_01_0088.html index 930ff9831..7daaac05b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0088.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0088.html @@ -13,8 +13,8 @@

              Creating a Cloud Search Service Link

              1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.
              2. Select Cloud Search Service and click Next. On the page that is displayed, configure the CSS link parameters.

                • Name: Enter a custom link name, for example, csslink.
                • Elasticsearch Server List: Enter the IP address and port number of the Cloud Search Service cluster (cluster later than 5.x). The format is ip:port. Use semicolons to separate multiple addresses. For example, 192.168.0.1:9200;192.168.0.2:9200.
                • Username and Password: Enter the username and password used for logging in to the Cloud Search Service cluster. The user must have the read and write permissions on the database.

              3. Click Save. The Link Management page is displayed.
              -

              Creating an OBS Link

              1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                Figure 1 Selecting a connector type
                -

              2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                • Name: Enter a custom link name, for example, obslink.
                • OBS Server and Port: Enter the actual OBS address information.
                • AK and SK: Enter the AK and SK used for logging in to OBS.
                  To obtain an access key, perform the following steps:
                  1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                  2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 2.
                    Figure 2 Clicking Create Access Key
                    +

                    Creating an OBS Link

                    1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                      Figure 1 Selecting a connector type
                      +

                    2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                      • Name: Enter a custom link name, for example, obslink.
                      • OBS Server and Port: Enter the actual OBS address information.
                      • AK and SK: Enter the AK and SK used for logging in to OBS.
                        To obtain an access key, perform the following steps:
                        1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                        2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 2.
                          Figure 2 Clicking Create Access Key
                        3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                          • Only two access keys can be added for each user.
                          • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                        @@ -22,14 +22,14 @@

                    3. Click Save. The Link Management page is displayed.
                    -

                    Creating a Migration Job

                    1. Choose Table/File Migration > Create Job to create a job for exporting data from OBS to Cloud Search Service.

                      Figure 3 Creating a job for migrating data from OBS to Cloud Search Service
                      +

                      Creating a Migration Job

                      1. Choose Table/File Migration > Create Job to create a job for exporting data from OBS to Cloud Search Service.

                        Figure 3 Creating a job for migrating data from OBS to Cloud Search Service
                        • Job Name: Enter a unique name.
                        • Source Job Configuration
                          • Source Link Name: Select the obslink link created in Creating an OBS Link.
                          • Bucket Name: Select the bucket from which the data will be migrated.
                          • Source Directory/File: Set this parameter to the path of the data to be migrated. You can migrate all directories and files in the bucket.
                          • File Format: Select CSV for migrating files to a data table.
                          • Retain the default values of the optional parameters in Show Advanced Attributes.
                        • Destination Job Configuration
                          • Destination Link Name: Select the csslink link created in Creating a Cloud Search Service Link.
                          • Index: Select the Elasticsearch index of the data to be written. You can also enter a new index. CDM automatically creates the index on Cloud Search Service.
                          • Type: Select the Elasticsearch type of the data to be written. You can enter a new type. CDM automatically creates a type at the migration destination.
                          • Retain the default values of the optional parameters in Show Advanced Attributes.

                      2. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields. See Figure 4.

                        • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                        • If the type is automatically created at the migration destination, you need to configure the type and name of each field.
                        • CDM supports field conversion during the migration.
                        -
                        Figure 4 Field mapping of Cloud Search Service
                        +
                        Figure 4 Field mapping of Cloud Search Service

                      3. Click Next and set task parameters. Generally, retain the default values of all parameters.

                        In this step, you can configure the following optional functions:
                        • Retry If Failed: Determine whether to automatically retry the job if it fails. Retain the default value Never.
                        • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                        • Schedule Execution: Determine whether to automatically execute the job at a scheduled time. Retain the default value No in this example.
                        • Concurrent Extractors: Enter the number of concurrent extractors. An appropriate value improves migration efficiency. Retain the default value 1.
                        • Write Dirty Data: Specify this parameter if data that fails to be processed or filtered out during job execution needs to be written to OBS for future viewing. Before writing dirty data, create an OBS link on the CDM console. Retain the default value No so that dirty data is not recorded.
                        -
                        Figure 5 Configuring the task
                        +
                        Figure 5 Configuring the task

                      4. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                      5. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                        On the Historical Record page, click Log to view the job logs.

                      @@ -41,3 +41,10 @@
                    + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0089.html b/docs/dataartsstudio/umn/dataartsstudio_01_0089.html index 74cf30452..3be21244e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0089.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0089.html @@ -10,11 +10,11 @@

                    In this scenario, if the CDM cluster is used only to migrate data from OBS to DLI and does not need to migrate data of other data sources, there is no special requirements on the VPC, subnet, and security group of the CDM cluster. You can specify them based on your needs. CDM accesses DLI and OBS through the intranet. The flavor of the CDM cluster is selected based on the amount of data to be migrated. Generally, cdm.medium meets the requirements for most migration scenarios.

                  Creating a DLI Link

                  1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.
                  2. Select Data Lake Insight, click Next, and configure the DLI link parameters. See Figure 1.

                    • Name: Enter a custom link name, for example, dlilink.
                    • AK and SK: Enter the AK and SK used for accessing the DLI database.
                    • Project ID: Enter the project ID of the region to which DLI belongs.
                    -
                    Figure 1 Creating a DLI link
                    +
                    Figure 1 Creating a DLI link

                  3. Click Save. The Link Management page is displayed.
                  -

                  Creating an OBS Link

                  1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                    Figure 2 Selecting a connector type
                    -

                  2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                    • Name: Enter a custom link name, for example, obslink.
                    • OBS Server and Port: Enter the actual OBS address information.
                    • AK and SK: Enter the AK and SK used for logging in to OBS.
                      To obtain an access key, perform the following steps:
                      1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                      2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                        Figure 3 Clicking Create Access Key
                        +

                        Creating an OBS Link

                        1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                          Figure 2 Selecting a connector type
                          +

                        2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                          • Name: Enter a custom link name, for example, obslink.
                          • OBS Server and Port: Enter the actual OBS address information.
                          • AK and SK: Enter the AK and SK used for logging in to OBS.
                            To obtain an access key, perform the following steps:
                            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                              Figure 3 Clicking Create Access Key
                            3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                              • Only two access keys can be added for each user.
                              • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                            @@ -22,13 +22,13 @@

                        3. Click Save. The Link Management page is displayed.
                        -

                        Creating a Migration Job

                        1. Choose Table/File Migration > Create Job to create a job for migrating data from OBS to DLI. See Figure 4.

                          Figure 4 Creating a job for migrating data from OBS to DLI
                          +

                          Creating a Migration Job

                          1. Choose Table/File Migration > Create Job to create a job for migrating data from OBS to DLI. See Figure 4.

                            Figure 4 Creating a job for migrating data from OBS to DLI
                            • Job Name: Enter a custom job name.
                            • Source Link Name: Select the obslink link created in Creating an OBS Link.
                              • Bucket Name: Select the bucket from which the data is to be migrated.
                              • Source Directory/File: Set this parameter to the path of the data to be migrated.
                              • File Format: Select CSV or JSON for transferring files to a data table.
                              • Retain the default values of the optional parameters in Show Advanced Attributes.
                            • Destination Link Name: Select the dlilink link created in Creating a DLI Link.
                              • Resource Queue: Enter the resource queue to which the destination table belongs.
                              • Database Name: Enter the name of the database to which data is to be written.
                              • Table Name: Enter the name of the table to which data is to be written. CDM cannot automatically create tables on DLI. The table must be created on DLI in advance, and the field types and formats of the table must be consistent with those of the data to be migrated.
                              • Clear Before Importing Data: Choose whether to clear data in the destination table before data import. In this example, retain the default value.

                          2. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields.

                            • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                            • CDM supports field conversion during the migration.

                          3. Click Next and set task parameters. Generally, retain the default values of all parameters.

                            In this step, you can configure the following optional functions:
                            • Retry If Failed: Determine whether to automatically retry the job if it fails. Retain the default value Never.
                            • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                            • Schedule Execution: Determine whether to automatically execute the job at a scheduled time. Retain the default value No in this example.
                            • Concurrent Extractors: Enter the number of concurrent extractors. An appropriate value improves migration efficiency. Retain the default value 1.
                            • Write Dirty Data: Specify this parameter if data that fails to be processed or filtered out during job execution needs to be written to OBS for future viewing. Before writing dirty data, create an OBS link on the CDM console. Retain the default value No so that dirty data is not recorded.
                            -
                            Figure 5 Configuring the task
                            +
                            Figure 5 Configuring the task

                          4. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                          5. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                            On the Historical Record page, click Log to view the job logs.

                          @@ -40,3 +40,10 @@
                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0091.html b/docs/dataartsstudio/umn/dataartsstudio_01_0091.html index 5051350e4..13566eea4 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0091.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0091.html @@ -4,7 +4,7 @@

                        Scenario

                        Cloud Search Service provides users with structured and unstructured data search, statistics, and report capabilities. This section describes how to use CDM to migrate data from the Oracle database to Cloud Search Service. The procedure is as follows:

                        1. Creating a CDM Cluster and Binding an EIP to the Cluster
                        2. Creating a Cloud Search Service Link
                        3. Creating an Oracle Link
                        4. Creating a Migration Job
                        -

                        Prerequisites

                        • You have subscribed to Cloud Search Service and obtained the IP address and port number of the Cloud Search Service cluster.
                        • You have obtained the IP address, name, username, and password of the Oracle database.
                        • If the Oracle database is deployed on an on-premises data center or a third-party cloud, ensure that an IP address that can be accessed from the public network has been configured for the Oracle database, or the VPN or Direct Connect between the on-premises data center and cloud has been established.
                        • You have uploaded the Oracle database driver on the Job Management > Links > Driver Management page.
                        +

                        Prerequisites

                        • You have subscribed to Cloud Search Service and obtained the IP address and port number of the Cloud Search Service cluster.
                        • You have obtained the IP address, name, username, and password of the Oracle database.
                        • If the Oracle database is deployed on an on-premises data center or a third-party cloud, ensure that an IP address that can be accessed from the public network has been configured for the Oracle database, or the VPN or Direct Connect between the on-premises data center and has been established.
                        • You have uploaded the Oracle database driver on the Job Management > Links > Driver Management page.

                        Creating a CDM Cluster and Binding an EIP to the Cluster

                        1. Create a CDM cluster.

                          The key configurations are as follows:
                          • The flavor of the CDM cluster is selected based on the amount of data to be migrated. Generally, cdm.medium meets the requirements for most migration scenarios.
                          • The CDM and Cloud Search Service clusters must be in the same VPC. In addition, it is recommended that the CDM cluster be in the same subnet and security group as the Cloud Search Service cluster.
                          • If the same subnet and security group cannot be used for security purposes, ensure that a security group rule has been configured to allow the CDM cluster to access the Cloud Search Service cluster.
                          @@ -18,14 +18,14 @@

                          Creating an Oracle Link

                          1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.
                          2. Select Oracle and click Next to configure parameters for the Oracle link.

                            • Name: Enter a custom link name, for example, oracle_link.
                            • Database Server and Port: Enter the address and port number of the Oracle server.
                            • Database Name: Enter the name of the Oracle database whose data is to be exported.
                            • Username and Password: Enter the username and password used for logging in to the Oracle database. The user must have the permission to read the Oracle metadata.

                          3. Click Save. The Link Management page is displayed.
                          -

                          Creating a Migration Job

                          1. Choose Table/File Migration > Create Job to create a job for exporting data from the Oracle database to Cloud Search Service.

                            Figure 1 Creating a job for migrating data from Oracle to Cloud Search Service
                            +

                            Creating a Migration Job

                            1. Choose Table/File Migration > Create Job to create a job for exporting data from the Oracle database to Cloud Search Service.

                              Figure 1 Creating a job for migrating data from Oracle to Cloud Search Service
                              • Job Name: Enter a unique name.
                              • Source Job Configuration
                                • Source Link Name: Select the oracle_link link created in Creating an Oracle Link.
                                • Schema/Tablespace: Enter the name of the database whose data is to be migrated.
                                • Table Name: Enter the name of the table to be migrated.
                                • Retain the default values of the optional parameters in Show Advanced Attributes.
                              • Destination Job Configuration
                                • Destination Link Name: Select the csslink link created in Creating a Cloud Search Service Link.
                                • Index: Select the Elasticsearch index of the data to be written. You can also enter a new index. CDM automatically creates the index on Cloud Search Service.
                                • Type: Select the Elasticsearch type of the data to be written. You can enter a new type. CDM automatically creates a type at the migration destination.
                                • Retain the default values of the optional parameters in Show Advanced Attributes.

                            2. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields, as shown in Figure 2.

                              • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                              • If the type is automatically created at the migration destination, you need to configure the type and name of each field.
                              • CDM supports field conversion during the migration.
                              -
                              Figure 2 Field mapping of Cloud Search Service
                              +
                              Figure 2 Field mapping of Cloud Search Service

                            3. Click Next and set task parameters. Generally, retain the default values of all parameters.

                              In this step, you can configure the following optional functions:
                              • Retry If Failed: Determine whether to automatically retry the job if it fails. Retain the default value Never.
                              • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                              • Schedule Execution: Determine whether to automatically execute the job at a scheduled time. Retain the default value No in this example.
                              • Concurrent Extractors: Enter the number of concurrent extractors. An appropriate value improves migration efficiency. Retain the default value 1.
                              • Write Dirty Data: Specify this parameter if data that fails to be processed or filtered out during job execution needs to be written to OBS for future viewing. Before writing dirty data, create an OBS link on the CDM console. Retain the default value No so that dirty data is not recorded.
                              -
                              Figure 3 Configuring the task
                              +
                              Figure 3 Configuring the task

                            4. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                            5. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                              On the Historical Record page, click Log to view the job logs.

                            @@ -37,3 +37,10 @@
                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0092.html b/docs/dataartsstudio/umn/dataartsstudio_01_0092.html index 0bc834a12..5b37edce1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0092.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0092.html @@ -6,7 +6,7 @@

                          Hive partitions are implemented by using the HDFS subdirectory function. Each subdirectory contains the column names and values of each partition. If there are multiple partitions, many HDFS subdirectories exist. It is not easy to load external data to each partition of the Hive table without relying on tools. With CDM, you can easily load data of the external data sources (relational databases, object storage services, and file system services) to Hive partition tables.

                          This section describes how to migrate data from the MySQL database to the MRS Hive partition table.

                          Scenario

                          Suppose that there is a trip_data table in the MySQL database. The table stores cycling records such as the start time, end time, start sites, end sites, and rider IDs. For details about the fields in the trip_data table, see Figure 1.

                          -
                          Figure 1 MySQL table fields
                          +
                          Figure 1 MySQL table fields

                          The following describes how to use CDM to import the trip_data table in the MySQL database to the MRS Hive partition table. The procedure is as follows:

                          1. Creating a Hive Partition Table on MRS Hive
                          2. Creating a CDM Cluster and Binding an EIP to the Cluster
                          3. Creating a MySQL Link
                          4. Creating a Hive Link
                          5. Creating a Migration Job
                          @@ -24,8 +24,8 @@

                      -

                      Creating a MySQL Link

                      1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                      2. Select RDS for MySQL and click Next to set the link parameters.

                        Figure 2 Creating a MySQL Link
                        -

                        Click Show Advanced Attributes to view more optional parameters. For details, see Link to an RDS for MySQL/MySQL Database. Retain the default values for the optional parameters and configure the mandatory parameters described in Table 1.

                        +

                        Creating a MySQL Link

                        1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                        2. Select RDS for MySQL and click Next to set the link parameters.

                          Figure 2 Creating a MySQL Link
                          +

                          Click Show Advanced Attributes to view more optional parameters. For details, see RDS for MySQL/MySQL Database Link Parameters. Retain the default values for the optional parameters and configure the mandatory parameters described in Table 1.

                          @@ -112,7 +112,7 @@

                          -

                          Creating a Hive Link

                          1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                            Figure 3 Selecting a connector type
                            +

                            Creating a Hive Link

                            1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                              Figure 3 Selecting a connector type

                            2. Select MRS Hive and click Next to configure parameters for the MRS Hive link.

                              Table 2 lists the parameters. Configure these parameters based on your actual situation.

                          Table 1 MySQL link parameters

                          Parameter

                          - @@ -179,7 +181,7 @@ - -
                          Table 2 MRS Hive link parameters

                          Parameter

                          @@ -132,7 +132,9 @@

                          Manager IP

                          Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.

                          +
                          Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
                          NOTE:

                          DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                          +
                          +

                          127.0.0.1

                          ldapUsername

                          This parameter is mandatory when Enable ldap is enabled.

                          +

                          This parameter is mandatory when Enable ldap is enabled.

                          Enter the username configured when LDAP authentication was enabled for MRS Hive.

                          -

                          @@ -187,7 +189,7 @@

                          ldapPassword

                          This parameter is mandatory when Enable ldap is enabled.

                          +

                          This parameter is mandatory when Enable ldap is enabled.

                          Enter the password configured when LDAP authentication was enabled for MRS Hive.

                          -

                          @@ -204,7 +206,7 @@

                          This parameter is mandatory when OBS storage support is enabled. The account corresponding to the AK/SK pair must have the OBS Buckets Viewer permission. Otherwise, OBS cannot be accessed and the "403 AccessDenied" error is reported.

                          You need to create an access key for the current account and obtain an AK/SK pair.

                          -
                          1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                          2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 4.
                            Figure 4 Clicking Create Access Key
                            +
                            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 4.
                              Figure 4 Clicking Create Access Key
                            3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                              NOTE:
                              • Only two access keys can be added for each user.
                              • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                            @@ -257,16 +259,16 @@

                            Creating a Migration Job

                            1. Click the Table/File Migration tab and then Create Job.

                              Set Clear Data Before Import to Yes, so that the data in the Hive table will be cleared before data import.

                            2. After configuring the parameters, click Next to go to the Map Field page shown in Figure 5.

                              Map the fields of the MySQL table and Hive table. The Hive table has three more fields y, ym, and ymd than the MySQL table, which are the Hive partition fields. Because the fields of the source table cannot be directly mapped to the destination table, you need to configure an expression to extract data from the StartDate field in the source table.

                              -
                              Figure 5 Hive field mapping
                              -

                            3. Click to display the Converter List dialog box, and then choose Create Converter > Expression conversion. See Figure 6.

                              The expressions for the y, ym, and ymd fields are as follows:

                              +
                              Figure 5 Hive field mapping
                              +

                            4. Click to display the Converter List dialog box, and then choose Create Converter > Expression conversion. See Figure 6.

                              The expressions for the y, ym, and ymd fields are as follows:

                              DateUtils.format(DateUtils.parseDate(row[2],"yyyy-MM-dd HH:mm:ss.SSS"),"yyyy")

                              DateUtils.format(DateUtils.parseDate(row[2],"yyyy-MM-dd HH:mm:ss.SSS"),"yyyyMM")

                              DateUtils.format(DateUtils.parseDate(row[2],"yyyy-MM-dd HH:mm:ss.SSS"),"yyyyMMdd")

                              -
                              Figure 6 Configuring the expression
                              +
                              Figure 6 Configuring the expression

                              The expressions in CDM support field conversion of common character strings, dates, and values.

                            5. Click Next and set task parameters. Generally, retain the default values of all parameters.

                              In this step, you can configure the following optional functions:
                              • Retry If Failed: Determine whether to automatically retry the job if it fails. Retain the default value Never.
                              • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                              • Schedule Execution: Determine whether to automatically execute the job at a scheduled time. Retain the default value No in this example.
                              • Concurrent Extractors: Enter the number of concurrent extractors. An appropriate value improves migration efficiency. Retain the default value 1.
                              • Write Dirty Data: Specify this parameter if data that fails to be processed or filtered out during job execution needs to be written to OBS for future viewing. Before writing dirty data, create an OBS link on the CDM console. Retain the default value No so that dirty data is not recorded.
                              -
                              Figure 7 Configuring the task
                              +
                              Figure 7 Configuring the task

                            6. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                            7. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                              On the Historical Record page, click Log to view the job logs.

                            @@ -278,3 +280,10 @@
                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0098.html b/docs/dataartsstudio/umn/dataartsstudio_01_0098.html index b799ca4a4..89d0e72a2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0098.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0098.html @@ -13,85 +13,84 @@

                          -

                          Creating a MySQL Link

                          1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                          2. Select RDS for MySQL and click Next to set the link parameters.

                            Figure 1 Creating a MySQL link
                            -

                            Click Show Advanced Attributes to view more optional parameters. For details, see Link to an RDS for MySQL/MySQL Database. Retain the default values of the optional parameters and configure the mandatory parameters according to Table 1.

                            +

                            Creating a MySQL Link

                            1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                            2. Select MySQL and click Next. On the displayed page, configure MySQL link parameters.

                              Click Show Advanced Attributes to view more optional parameters. For details, see RDS for MySQL/MySQL Database Link Parameters. Retain the default values of the optional parameters and configure the mandatory parameters according to Table 1.

                              -
                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0502.html b/docs/dataartsstudio/umn/dataartsstudio_01_0502.html index 72eef475d..2a6340f83 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0502.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0502.html @@ -7,7 +7,7 @@

                              The tables involved in this example are as follows:

                              • trade_log: This table records data generated in each transaction.
                              • trade_report: This table is generated based on trade_log and records the daily transaction summary.
                              -

                              Prerequisites

                              • A DLI data connection named dli_demo has been created.

                                If this data connection is not created, create one. For details, see Managing Data Connections.

                                +

                                Prerequisites

                                • A DLI data connection named dli_demo has been created.

                                  If this data connection is not created, create one. For details, see Configuring DataArts Studio Data Connection Parameters.

                                • A database named dli_db has been created in DLI.

                                  If this database is not created, create one. For details, see Creating a Database.

                                • Tables trade_log and trade_report have been created in the dli_db database.

                                  If the tables are not created, create them. For details, see Creating a Table.

                                @@ -22,7 +22,7 @@ FROM trade_log where date_format(trade_time, 'yyyy-MM-dd') = '${yesterday}' -
                              • Click and set the script name to generate_trade_report.
                              • +
                              • Click and set the script name to generate_trade_report.
                              • Create and develop a job.

                                1. In the left navigation pane on the DataArts Factory console, choose Data Development > Develop Job and click Create Job to create an empty job named job.
                                2. Go to the job development page, drag the DLI SQL node to the canvas, click the icon, and configure node properties.

                                  Description of key properties:

                                  • SQL Script: SQL script generate_trade_report that is developed in 1.
                                  • Database Name: Database configured in SQL script generate_trade_report.
                                  • Queue Name: Resource queue configured in SQL script generate_trade_report.
                                  • Script Parameter: Parameter yesterday configured in SQL script generate_trade_report. Enter the following EL expression as the parameter values:
                                    #{Job.getYesterday("yyyy-MM-dd")}

                                    Expression Description: The job object uses the getYesterday method to obtain the time of the day before the job plan execution time. The time format is yyyy-MM-dd.

                                    @@ -36,7 +36,7 @@ FROM where date_format(trade_time, 'yyyy-MM-dd') = '2018-09-25'
                                  -
                                3. Click to test the running job.
                                4. After the job test is complete, click to save the job configuration.
                                +
                              • Click to test the running job.
                              • After the job test is complete, click to save the job configuration.
                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0503.html b/docs/dataartsstudio/umn/dataartsstudio_01_0503.html index 1ffe23d79..3ee8fb7b2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0503.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0503.html @@ -6,7 +6,7 @@

                              You can perform the following operations on a solution:

                              Creating a Solution

                              On the development page of DLF, create a solution, set the solution name, and select business-related jobs.

                              -
                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                              3. In the navigation tree on the left of the data development page, choose Development > Develop Script or Data Development > Develop Job.
                              4. Above the directory on the left, click to show the solution directory.
                              5. Click in the upper part of the solution directory. The Create Solution page is displayed. Table 1 describes the solution parameters. +
                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                3. In the navigation tree on the left of the data development page, choose Development > Develop Script or Data Development > Develop Job.
                                4. Above the directory on the left, click to show the solution directory.
                                5. Click in the upper part of the solution directory. The Create Solution page is displayed. Table 1 describes the solution parameters.
                              Table 1 MySQL link parameters

                              Parameter

                              +
                              - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - @@ -101,13 +100,13 @@

                              -

                              Creating an RDS Link

                              1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                                Figure 2 Selecting a connector type
                                +

                                Creating an RDS Link

                                1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                                  Figure 1 Selecting a connector type

                                2. Select RDS for MySQL and click Next to configure parameters for the RDS for MySQL link.

                                  • Name: Enter a custom link name, for example, rds_link.
                                  • Database Server and Port: Enter the address information about the RDS for MySQL database.
                                  • Database Name: Enter the name of the RDS for MySQL database.
                                  • Username and Password: Enter the username and password used for logging in to the database.
                                  • During RDS link creation, if Use Local API in Show Advanced Attributes is set to Yes, you can use the LOAD DATA function provided by MySQL to speed up data import.
                                  • The LOAD DATA function is disabled by default on RDS for MySQL, so you need to modify the parameter group of the MySQL instance and set local_infile to ON to enable this function.
                                  • If the local_infile parameter group cannot be edited, it is the default parameter group. You need to create a parameter group and modify its value, and apply it to the MySQL instance of RDS.

                                3. Click Save. The Link Management page is displayed.
                                -

                                Creating an Entire DB Migration Job

                                1. After the two links are created, choose Entire DB Migration > Create Job to create a migration job. See Figure 3.

                                  Figure 3 Creating an entire DB migration job
                                  +

                                  Creating an Entire DB Migration Job

                                  1. After the two links are created, choose Entire DB Migration > Create Job to create a migration job. See Figure 2.

                                    Figure 2 Creating an entire DB migration job
                                    • Job Name: Enter a name for the entire DB migration job.
                                    • Source Job Configuration
                                      • Source Link Name: Select the mysqllink created in Creating a MySQL Link.
                                      • Schema/Tablespace: Select the on-premises MySQL database from which data is to be exported.
                                    • Destination Job Configuration
                                      • Destination Link Name: Select the rds_link link created in Creating an RDS Link.
                                      • Schema/Tablespace: Select the name of the RDS database to which data is to be imported.
                                      • Auto Table Creation: Select Auto creation, which indicates that CDM automatically creates tables in the RDS database when tables of the on-premises MySQL database do not exist in the RDS database.
                                      • Clear Data Before Import: Select Yes, which indicates that when a table with the same name as the table in the on-premises MySQL database exists in the RDS database, CDM clears data in the table on RDS.
                                      • Constraint Conflict Handling: Select insert into.
                                      • Retain the default values of the optional parameters in Show Advanced Attributes.
                                    @@ -122,3 +121,10 @@
                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0099.html b/docs/dataartsstudio/umn/dataartsstudio_01_0099.html index b8ee06d29..a0e7d116b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0099.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0099.html @@ -4,7 +4,7 @@

                                Scenario

                                CSS provides users with structured and unstructured data search, statistics, and report capabilities. This section describes how to use CDM to migrate the entire Elasticsearch database to Cloud Search Service. The procedure is as follows:

                                1. Creating a CDM Cluster and Binding an EIP to the Cluster
                                2. Creating a Cloud Search Service Link
                                3. Creating an Elasticsearch Link
                                4. Creating an Entire DB Migration Job
                                -

                                Prerequisites

                                • You have sufficient EIP quota.
                                • You have subscribed to CSS and obtained the IP address and port number of the CSS cluster.
                                • You have obtained the IP address, port number, username, and password of the on-premises Elasticsearch database server.

                                  If the Elasticsearch server is deployed on an on-premises data center or a third-party cloud, ensure that an IP address that can be accessed from the public network has been configured for the Elasticsearch server, or the VPN or Direct Connect between the on-premises data center and cloud has been established.

                                  +

                                  Prerequisites

                                  • You have sufficient EIP quota.
                                  • You have subscribed to CSS and obtained the IP address and port number of the CSS cluster.
                                  • You have obtained the IP address, port number, username, and password of the on-premises Elasticsearch database server.

                                    If the Elasticsearch server is deployed on an on-premises data center or a third-party cloud, ensure that an IP address that can be accessed from the public network has been configured for the Elasticsearch server, or the VPN or Direct Connect between the on-premises data center and has been established.

                                  Creating a CDM Cluster and Binding an EIP to the Cluster

                                  1. Create a CDM cluster.

                                    The key configurations are as follows:
                                    • The flavor of the CDM cluster is selected based on the amount of data to be migrated. Generally, cdm.medium meets the requirements for most migration scenarios.
                                    • The CDM and Cloud Search Service clusters must be in the same VPC. In addition, it is recommended that the CDM cluster be in the same subnet and security group as the Cloud Search Service cluster.
                                    • If the same subnet and security group cannot be used for security purposes, ensure that a security group rule has been configured to allow the CDM cluster to access the Cloud Search Service cluster.
                                    @@ -19,12 +19,12 @@

                                    Creating an Elasticsearch Link

                                    1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                                    2. Select Elasticsearch and click Next to configure parameters for the Elasticsearch link. The parameters are the same as those for the CSS link.

                                      • Name: Enter a custom link name, for example, es_link.
                                      • Elasticsearch Server List: Enter the IP address and port number of the on-premises Elasticsearch database. Use semicolons to separate multiple addresses.

                                    3. Click Save. The Link Management page is displayed.
                                    -

                                    Creating an Entire DB Migration Job

                                    1. Choose Entire DB Migration > Create Job to create an entire DB migration job.

                                      Figure 1 Creating an entire DB migration job
                                      +

                                      Creating an Entire DB Migration Job

                                      1. Choose Entire DB Migration > Create Job to create an entire DB migration job.

                                        Figure 1 Creating an entire DB migration job
                                        • Job Name: Enter a unique name.
                                        • Source Job Configuration
                                          • Source Link Name: Select the es_link link created in Creating an Elasticsearch Link.
                                          • Index: Click the icon next to the text box to select an index in the on-premises Elasticsearch database or manually enter an index name. The name can contain only lowercase letters. If multiple indexes need to be migrated at a time, set this parameter to a wildcard character. CDM migrates all indexes that meet the wildcard condition. For example, if this parameter is set to cdm*, CDM migrates all indexes starting with cdm, such as cdm01, cdmB3, cdm_45 and so on.
                                        • Destination Job Configuration
                                          • Destination Link Name: Select the csslink link created in Creating a Cloud Search Service Link.
                                          • Index: Enter the index of the data to be written. You can select an existing index in Cloud Search Service or manually enter an index name that does not exist. The name can contain only lowercase letters. CDM automatically creates the index in Cloud Search Service. If multiple indexes are migrated at a time, this parameter cannot be configured. CDM automatically creates indexes at the migration destination.
                                          • Clear Data Before Import: If the selected index already exists in Cloud Search Service, you can choose whether to clear the data in the index before importing data. If you select No, the data is added to the index.

                                      1. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.

                                        A sub-job will be generated for each type in the on-premises Elasticsearch index for concurrent execution. You can click the job name to view the sub-job progress.

                                        -

                                      1. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records, read/write statistics, and job logs (only the sub-jobs have job logs).

                                        Figure 2 Historical Record
                                        +

                                      1. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records, read/write statistics, and job logs (only the sub-jobs have job logs).

                                        Figure 2 Historical Record

                                    @@ -34,3 +34,10 @@
                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0100.html b/docs/dataartsstudio/umn/dataartsstudio_01_0100.html index b756cc6e4..ab3f6ad83 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0100.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0100.html @@ -12,85 +12,84 @@

                              -

                              Creating a MySQL Link

                              1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                              2. Select RDS for MySQL and click Next to set the link parameters.

                                Figure 1 Creating a MySQL link
                                -

                                Click Show Advanced Attributes to view more optional parameters. For details, see Link to an RDS for MySQL/MySQL Database. Retain the default values of the optional parameters and configure the mandatory parameters according to Table 1.

                                +

                                Creating a MySQL Link

                                1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                                2. Select MySQL and click Next. On the displayed page, configure MySQL link parameters.

                                  Click Show Advanced Attributes to view more optional parameters. For details, see RDS for MySQL/MySQL Database Link Parameters. Retain the default values of the optional parameters and configure the mandatory parameters according to Table 1.

                                  -
                              Table 1 MySQL link parameters

                              Parameter

                              Description

                              +

                              Description

                              Example Value

                              +

                              Example Value

                              Name

                              +

                              Name

                              Unique link name

                              +

                              Unique link name

                              mysqllink

                              +

                              mysqllink

                              Database Server

                              +

                              Database Server

                              IP address or domain name of the MySQL database server

                              +

                              IP address or domain name of the MySQL database server

                              -

                              +

                              -

                              Port

                              +

                              Port

                              MySQL database port

                              +

                              MySQL database port

                              3306

                              +

                              3306

                              Database Name

                              +

                              Database Name

                              Name of the MySQL database

                              +

                              Name of the MySQL database

                              sqoop

                              +

                              sqoop

                              Username

                              +

                              Username

                              User who has the read, write, and delete permissions on the MySQL database

                              +

                              User who has the read, write, and delete permissions on the MySQL database

                              admin

                              +

                              admin

                              Password

                              +

                              Password

                              Password of the user

                              +

                              Password of the user

                              -

                              +

                              -

                              Use Local API

                              +

                              Use Local API

                              Whether to use the local API of the database for acceleration. (The system attempts to enable the local_infile system variable of the MySQL database.)

                              +

                              Whether to use the local API of the database for acceleration. (The system attempts to enable the local_infile system variable of the MySQL database.)

                              Yes

                              +

                              Yes

                              Use Agent

                              +

                              Use Agent

                              Whether to extract data from the data source through an agent

                              +

                              The agent function will be unavailable soon and does not need to be configured.

                              No

                              +

                              -

                              local_infile Character Set

                              +

                              local_infile Character Set

                              When using local_infile to import data to MySQL, you can configure the encoding format.

                              +

                              When using local_infile to import data to MySQL, you can configure the encoding format.

                              utf8

                              +

                              utf8

                              Driver Version

                              +

                              Driver Version

                              Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database. Download the MySQL driver 5.1.48 from https://downloads.mysql.com/archives/c-j/, obtain mysql-connector-java-5.1.48.jar, and upload it.

                              +

                              Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database. Download the MySQL driver 5.1.48 from https://downloads.mysql.com/archives/c-j/, obtain mysql-connector-java-5.1.48.jar, and upload it.

                              -

                              +

                              -

                              - - - - + + + - + + + + - @@ -72,7 +72,7 @@ - @@ -83,7 +83,7 @@

                              This method only obtains the parameter values configured for the current job, but not parameter values passed from the parent job or the global variables configured for the workspace.

                              To obtain the parameter values passed from the parent job and the global variables configured for the workspace, you are advised to use the ${job_param_name} expression.

                              - @@ -91,7 +91,7 @@ - @@ -99,7 +99,7 @@ - @@ -107,7 +107,7 @@ - @@ -116,7 +116,7 @@ - @@ -124,7 +124,7 @@ - @@ -133,7 +133,7 @@ - @@ -142,10 +142,46 @@ - + + + + + + + + + + + + + + + +
                              Table 1 MySQL link parameters

                              Parameter

                              +
                              - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - @@ -100,8 +99,8 @@

                              -

                              Creating an OBS Link

                              1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                                Figure 2 Selecting a connector type
                                -

                              2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                                • Name: Enter a custom link name, for example, obslink.
                                • OBS Server and Port: Enter the actual OBS address information.
                                • AK and SK: Enter the AK and SK used for logging in to OBS.
                                  To obtain an access key, perform the following steps:
                                  1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                  2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                                    Figure 3 Clicking Create Access Key
                                    +

                                    Creating an OBS Link

                                    1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                                      Figure 1 Selecting a connector type
                                      +

                                    2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                                      • Name: Enter a custom link name, for example, obslink.
                                      • OBS Server and Port: Enter the actual OBS address information.
                                      • AK and SK: Enter the AK and SK used for logging in to OBS.
                                        To obtain an access key, perform the following steps:
                                        1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                        2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 2.
                                          Figure 2 Clicking Create Access Key
                                        3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                                          • Only two access keys can be added for each user.
                                          • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                                        @@ -109,12 +108,12 @@

                                    3. Click Save. The Link Management page is displayed.
                                    -

                                    Creating a Migration Job

                                    1. Choose Table/File Migration > Create Job to create a job for exporting data from the MySQL database to OBS.

                                      Figure 4 Creating a job for migrating data from MySQL to OBS
                                      +

                                      Creating a Migration Job

                                      1. Choose Table/File Migration > Create Job to create a job for exporting data from the MySQL database to OBS.

                                        Figure 3 Creating a job for migrating data from MySQL to OBS
                                        • Job Name: Enter a unique name.
                                        • Source Job Configuration
                                          • Source Link Name: Select the mysqllink created in Creating a MySQL Link.
                                          • Use SQL Statement: Select No.
                                          • Schema/Tablespace: name of the schema or tablespace from which data is to be extracted
                                          • Table Name: name of the table from which data is to be extracted
                                          • Retain the default values of other optional parameters.
                                        • Destination Job Configuration
                                          • Destination Link Name: Select the obslink created in Creating an OBS Link.
                                          • Bucket Name: Select the bucket from which the data will be migrated.
                                          • Write Directory: Enter the directory to which data is to be written on the OBS server.
                                          • File Format: Select CSV.
                                          • Retain the default values of the optional parameters in Show Advanced Attributes.
                                        -

                                      2. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields, as shown in Figure 5.

                                        • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                                        • The expressions in CDM support field conversion of common character strings, dates, and values.
                                        -
                                        Figure 5 Table-to-file field mapping
                                        +

                                      3. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields, as shown in Figure 4.

                                        • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                                        • The expressions in CDM support field conversion of common character strings, dates, and values.
                                        +
                                        Figure 4 Table-to-file field mapping

                                      4. Click Next and set task parameters. Generally, retain the default values of all parameters.

                                        In this step, you can configure the following optional functions:
                                        • Retry Upon Failure: If the job fails to be executed, you can determine whether to automatically retry. Retain the default value Never.
                                        • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                                        • Schedule Execution: Enable it if you need to configure scheduled jobs. Retain the default value No.
                                        • Concurrent Extractors: Enter the number of extractors to be concurrently executed. CDM supports concurrent extraction of MySQL data. If indexes are configured for the source table, you can increase the number of concurrent extractors to accelerate the migration.
                                        • Write Dirty Data: Specify this parameter if data that fails to be processed or filtered out during job execution needs to be written to OBS for future viewing. Before writing dirty data, create an OBS link. For file-to-table data migration, you are advised to write dirty data.
                                        • Delete Job After Completion: Retain the default value Do not delete. You can also set this parameter to Delete to prevent an accumulation of too many migration jobs.

                                      5. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                                      6. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                                        On the Historical Record page, click Log to view the job logs.

                                        @@ -127,3 +126,10 @@
                                    + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0101.html b/docs/dataartsstudio/umn/dataartsstudio_01_0101.html index 6a7eafad9..e84bfd5e0 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0101.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0101.html @@ -12,85 +12,84 @@

                              -

                              Creating a MySQL Link

                              1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                              2. Select RDS for MySQL and click Next to set the link parameters.

                                Figure 1 Creating a MySQL link
                                -

                                Click Show Advanced Attributes to view more optional parameters. For details, see Link to an RDS for MySQL/MySQL Database. Retain the default values of the optional parameters and configure the mandatory parameters according to Table 1.

                                +

                                Creating a MySQL Link

                                1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.
                                2. Select MySQL and click Next. On the displayed page, configure MySQL link parameters.

                                  Click Show Advanced Attributes to view more optional parameters. For details, see RDS for MySQL/MySQL Database Link Parameters. Retain the default values of the optional parameters and configure the mandatory parameters according to Table 1.

                                  -
                              Table 1 MySQL link parameters

                              Parameter

                              Description

                              +

                              Description

                              Example Value

                              +

                              Example Value

                              Name

                              +

                              Name

                              Unique link name

                              +

                              Unique link name

                              mysqllink

                              +

                              mysqllink

                              Database Server

                              +

                              Database Server

                              IP address or domain name of the MySQL database server

                              +

                              IP address or domain name of the MySQL database server

                              -

                              +

                              -

                              Port

                              +

                              Port

                              MySQL database port

                              +

                              MySQL database port

                              3306

                              +

                              3306

                              Database Name

                              +

                              Database Name

                              Name of the MySQL database

                              +

                              Name of the MySQL database

                              sqoop

                              +

                              sqoop

                              Username

                              +

                              Username

                              User who has the read, write, and delete permissions on the MySQL database

                              +

                              User who has the read, write, and delete permissions on the MySQL database

                              admin

                              +

                              admin

                              Password

                              +

                              Password

                              Password of the user

                              +

                              Password of the user

                              -

                              +

                              -

                              Use Local API

                              +

                              Use Local API

                              Whether to use the local API of the database for acceleration. (The system attempts to enable the local_infile system variable of the MySQL database.)

                              +

                              Whether to use the local API of the database for acceleration. (The system attempts to enable the local_infile system variable of the MySQL database.)

                              Yes

                              +

                              Yes

                              Use Agent

                              +

                              Use Agent

                              Whether to extract data from the data source through an agent

                              +

                              The agent function will be unavailable soon and does not need to be configured.

                              No

                              +

                              -

                              local_infile Character Set

                              +

                              local_infile Character Set

                              When using local_infile to import data to MySQL, you can configure the encoding format.

                              +

                              When using local_infile to import data to MySQL, you can configure the encoding format.

                              utf8

                              +

                              utf8

                              Driver Version

                              +

                              Driver Version

                              Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database. Download the MySQL driver 5.1.48 from https://downloads.mysql.com/archives/c-j/, obtain mysql-connector-java-5.1.48.jar, and upload it.

                              +

                              Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database. Download the MySQL driver 5.1.48 from https://downloads.mysql.com/archives/c-j/, obtain mysql-connector-java-5.1.48.jar, and upload it.

                              -

                              +

                              -

                              + + + + + + @@ -167,7 +213,7 @@ + + + + + + + + + + + +
                              Table 1 MySQL link parameters

                              Parameter

                              +
                              - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - @@ -153,14 +152,14 @@ - - - @@ -177,12 +176,12 @@

                            3. Click Save.
                            4. -

                              Creating a Migration Job

                              1. Choose Table/File Migration > Create Job to create a job for exporting data from the MySQL database to DWS.

                                Figure 2 Creating a job for migrating data from MySQL to DWS
                                +

                                Creating a Migration Job

                                1. Choose Table/File Migration > Create Job to create a job for exporting data from the MySQL database to DWS.

                                  Figure 1 Creating a job for migrating data from MySQL to DWS
                                  • Job Name: Enter a unique name.
                                  • Source Job Configuration
                                    • Source Link Name: Select the mysqllink created in Creating a MySQL Link.
                                    • Use SQL Statement: Select No.
                                    • Schema/Tablespace: name of the schema or tablespace from which data is to be extracted
                                    • Table Name: name of the table from which data is to be extracted
                                    • Retain the default values of other optional parameters.
                                    -
                                  • Destination Job Configuration
                                    • Destination Link Name: Select the dwslink created in Creating a DWS Link.
                                    • Schema/Tablespace: Select the DWS database to which data is to be written.
                                    • Auto Table Creation: This parameter is displayed only when both the migration source and destination are relational databases.
                                    • Table Name: Name of the table to which data is to be written. You can enter a table name that does not exist. CDM automatically creates the table in DWS.
                                    • isCompress: whether to compress data. If you select Yes, high-level compression will be performed. CDM applies to compression scenarios where the I/O read/write volume is large and the CPU is sufficient (the computing load is relatively low).
                                    • Orientation: You can create row- or column-store tables as needed. Generally, if a table contains many columns (called a wide table) and its query involves only a few columns, column storage is recommended. If a table contains only a few columns and a query includes most of the fields, row storage is recommended.
                                    • Extend char length: If the data encoding formats of the migration source and destination are different, the character length of the automatic table creation may be insufficient. If you select Yes for this parameter, the character length will be increased by three times during automatic table creation.
                                    • Clear Data Before Import: whether to clear data in the destination table before the migration task starts.
                                    +
                                  • Destination Job Configuration
                                    • Destination Link Name: Select the dwslink created in Creating a DWS Link.
                                    • Schema/Tablespace: Select the DWS database to which data is to be written.
                                    • Auto Table Creation: This parameter is displayed only when both the migration source and destination are relational databases.
                                    • Table Name: Name of the table to which data is to be written. You can enter a table name that does not exist. CDM automatically creates the table in DWS.
                                    • isCompress: whether to compress data. If you select Yes, high-level compression will be performed. CDM applies to compression scenarios where the I/O read/write volume is large and the CPU is sufficient (the computing load is relatively low).
                                    • Orientation: You can create row- or column-store tables as needed. Generally, if a table contains many columns (called a wide table) and its query involves only a few columns, column storage is recommended. If a table contains only a few columns and a query includes most of the fields, row storage is recommended.
                                    • Extend char length: If the data encoding formats of the migration source and destination are different, the character length of the automatic table creation may be insufficient. If you select Yes for this parameter, the character length will be increased by three times during automatic table creation.
                                    • Clear Data Before Import: whether to clear data in the destination table before the migration task starts.
                                  -

                                2. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields, as shown in Figure 3.

                                  • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                                  • The expressions in CDM support field conversion of common character strings, dates, and values.
                                  -
                                  Figure 3 Table-to-table field mapping
                                  +

                                3. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields, as shown in Figure 2.

                                  • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                                  • The expressions in CDM support field conversion of common character strings, dates, and values.
                                  +
                                  Figure 2 Table-to-table field mapping

                                4. Click Next and set task parameters. Generally, retain the default values of all parameters.

                                  In this step, you can configure the following optional functions:
                                  • Retry Upon Failure: If the job fails to be executed, you can determine whether to automatically retry. Retain the default value Never.
                                  • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                                  • Schedule Execution: Enable it if you need to configure scheduled jobs. Retain the default value No.
                                  • Concurrent Extractors: Enter the number of extractors to be concurrently executed. You can increase the value of this parameter to improve migration efficiency.
                                  • Write Dirty Data: Dirty data may be generated during data migration between tables. You are advised to select Yes.
                                  • Delete Job After Completion: Retain the default value Do not delete.

                                5. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                                6. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                                  On the Historical Record page, click Log to view the job logs.

                                  @@ -195,3 +194,10 @@
                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0103.html b/docs/dataartsstudio/umn/dataartsstudio_01_0103.html index 729d58a47..07de4a0e0 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0103.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0103.html @@ -13,13 +13,13 @@

                              -

                              Creating an MRS HDFS Link

                              1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.

                                Figure 1 Selecting a connector type
                                +

                                Creating an MRS HDFS Link

                                1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.

                                  Figure 1 Selecting a connector type

                                2. Select MRS HDFS and click Next to configure parameters for the MRS HDFS link.

                                  • Name: Enter a custom link name, for example, mrs_hdfs_link.
                                  • Manager IP: IP address of MRS Manager. Click Select next to the Manager IP text box to select a created MRS cluster. CDM automatically fills in the authentication information.
                                  • Username: If Authentication Method is set to KERBEROS, set the username and password for logging in to MRS Manager.

                                    If you need to create a snapshot when exporting a directory from HDFS, the user configured here must have the administrator permission on HDFS.

                                  • Password: password for logging in to MRS Manager
                                  • Authentication Method: authentication method for accessing MRS
                                  • Run Mode: Select the running mode of the HDFS link.

                                -

                                Creating an OBS Link

                                1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                                  Figure 2 Selecting a connector type
                                  -

                                2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                                  • Name: Enter a custom link name, for example, obslink.
                                  • OBS Server and Port: Enter the actual OBS address information.
                                  • AK and SK: Enter the AK and SK used for logging in to OBS.
                                    To obtain an access key, perform the following steps:
                                    1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                    2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                                      Figure 3 Clicking Create Access Key
                                      +

                                      Creating an OBS Link

                                      1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.

                                        Figure 2 Selecting a connector type
                                        +

                                      2. Select Object Storage Service (OBS) and click Next to configure parameters for the OBS link.

                                        • Name: Enter a custom link name, for example, obslink.
                                        • OBS Server and Port: Enter the actual OBS address information.
                                        • AK and SK: Enter the AK and SK used for logging in to OBS.
                                          To obtain an access key, perform the following steps:
                                          1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                          2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                                            Figure 3 Clicking Create Access Key
                                          3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                                            • Only two access keys can be added for each user.
                                            • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                                          @@ -27,7 +27,7 @@

                                      3. Click Save. The Link Management page is displayed.
                                      -

                                      Creating a Migration Job

                                      1. Choose Table/File Migration > Create Job to create a job for exporting data from the MRS HDFS database to OBS.

                                        Figure 4 Creating a job for migrating data from MRS HDFS to OBS
                                        +

                                        Creating a Migration Job

                                        1. Choose Table/File Migration > Create Job to create a job for exporting data from the MRS HDFS database to OBS.

                                          Figure 4 Creating a job for migrating data from MRS HDFS to OBS
                                          • Job Name: Enter a unique name.
                                          • Source Job Configuration
                                            • Source Link Name: Select the hdfs_llink created in Creating an MRS HDFS Link.
                                            • Source Directory/File: Enter the directory or file path of the data to be migrated.
                                            • File Format: Select the file format used for data transmission. Select Binary. If files are transferred without being parsed, the file format does not have to be Binary. This applies to file copy.
                                            • Retain the default values of other optional parameters.
                                          • Destination Job Configuration
                                            • Destination Link Name: Select the obs_link created in Creating an OBS Link.
                                            • Bucket Name: Select the bucket from which the data will be migrated.
                                            • Write Directory: Enter the directory to which data is to be written on the OBS server.
                                            • File Format: Select Binary.
                                            • Retain the default values of the optional parameters in Show Advanced Attributes.
                                          @@ -44,3 +44,10 @@
                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0104.html b/docs/dataartsstudio/umn/dataartsstudio_01_0104.html index 7d9a3cd6b..67aa75b48 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0104.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0104.html @@ -1,15 +1,16 @@

                                      Configuring Field Converters

                                      -

                                      Scenario

                                      • After the job parameters are configured, field mapping needs to be configured. You can click in the Operation column to create a field converter.
                                      • If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.
                                      +

                                      Scenario

                                      • After the job parameters are configured, field mapping needs to be configured. You can click in the Operation column to create a field converter.
                                      • If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.
                                      -
                                      You can create a field converter on the Map Field page when creating a table/file migration job.
                                      Figure 1 Creating a field converter
                                      +
                                      You can create a field converter on the Map Field page when creating a table/file migration job.
                                      Figure 1 Creating a field converter

                                      CDM can convert fields during migration. Currently, the following field converters are supported:

                                      -

                                      Constraints

                                      • If Use SQL Statement is set to Yes in the source job configuration, converters cannot be created.
                                      • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
                                      • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
                                      • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datetime) so that they can be written.
                                      • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
                                      • Field converters configuration is not involved when the binary format is used to migrate files to files.
                                      • In the automatic table creation scenario, you need to manually add fields to the destination table in advance and then add fields to the field mapping.
                                      • After a field is added, its sample value is not displayed on the console. This does not affect the field value transmission. CDM directly writes the field value to the destination end.
                                      • If the field mapping is incorrect, you can adjust the field mapping by dragging fields or clicking to map fields in batches.
                                      • An expression processes the data of a field. When creating an expression converter, you are not advised to use a time macro. If you need to use a time macro, use either of the following methods (if the source is of the file type, only Method 1 is supported):
                                        • Method 1: When creating an expression converter, use two single quotation marks ('') to enclose the expression.

                                          For example, if expression ${dateformat(yyyy-MM-dd)} is not enclosed in quotation marks, the hyphen (-) in the value 2017-10-16 parsed from the expression will be recognized as a minus sign, and further calculation will be performed to generate result 1991, which is incorrect. If you enclose the expression in quotation marks, that is, '${dateformat(yyyy-MM-dd)}', you will obtain '2017-10-16', which is correct.

                                          -

                                          -
                                        • Method 2: Add a custom source field, enter a macro variable of date and time for Example Value, and map the field to a destination field again.

                                          +

                                          Constraints

                                          • If Use SQL Statement is set to Yes in the source job configuration, converters cannot be created.
                                          • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
                                          • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
                                          • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datetime) so that they can be written.
                                          • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
                                          • Field converters configuration is not involved when the binary format is used to migrate files to files.
                                          • In the automatic table creation scenario, you need to manually add fields to the destination table in advance and then add fields to the field mapping.
                                          • After a field is added, its sample value is not displayed on the console. This does not affect the field value transmission. CDM directly writes the field value to the destination end.
                                          • If the field mapping is incorrect, you can adjust the field mapping by dragging fields or clicking to map fields in batches.
                                          • An expression processes the data of a field. When you create an expression converter, do not use a time macro. If you need to use a time macro, use either of the following methods (if the source is of the file type, only Method 1 is supported):
                                            • Method 1: When creating an expression converter, use two single quotation marks ('') to enclose the expression.

                                              For example, if expression ${dateformat(yyyy-MM-dd)} is not enclosed in quotation marks, the hyphen (-) in the value 2017-10-16 parsed from the expression will be recognized as a minus sign, and further calculation will be performed to generate result 1991, which is incorrect. If you enclose the expression in quotation marks, that is, '${dateformat(yyyy-MM-dd)}', you will obtain '2017-10-16', which is correct.

                                              +
                                              Figure 2 Using two single quotation marks ('') to enclose an expression
                                              +

                                              +
                                            • Method 2: Add a custom source field, enter a macro variable of date and time for Example Value, and map the field to a destination field again.
                                              Figure 3 Adding a custom source field
                                          • If the data is imported to GaussDB(DWS), you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following rules:
                                            1. Use the primary key as the distribution column.
                                            2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
                                            3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
                                          @@ -25,12 +26,13 @@

                                          Remove line break

                                          This converter is used to delete the newline characters, such as \n, \r, and \r\n from the field.

                                          -

                                          Expression Conversion

                                          This converter uses the JSP expression language (EL) to convert the current field or a row of data. The JSP EL is used to create arithmetic and logical expressions. Within a JSP EL expression, you can use integers, floating point numbers, strings, the built-in constants true and false for boolean values, and null.

                                          +

                                          Expression Conversion

                                          This converter uses the JSP expression language (EL) to convert the current field or a row of data. The JSP EL is used to create arithmetic and logical expressions. In an expression, you can use integers, floating point numbers, strings, constants true and false, and null.

                                          +

                                          During data conversion, if the content to be replaced contains a special character, use a backslash (\) to escape the special character to a common one.

                                          • The expression supports the following environment variables:
                                            • value: indicates the current field value.
                                            • row: indicates the current row, which is an array type.
                                          • The expression supports the following Utils:
                                            1. If the field is of the string type, convert all character strings into lowercase letters, for example, convert aBC to abc.

                                              Expression: StringUtils.lowerCase(value)

                                            2. Convert all character strings of the current field to uppercase letters.

                                              Expression: StringUtils.upperCase(value)

                                            3. Convert the format of the first date field from 2018-01-05 15:15:05 to 20180105.

                                              Expression: DateUtils.format(DateUtils.parseDate(row[0],"yyyy-MM-dd HH:mm:ss"),"yyyyMMdd")

                                              -
                                            4. Convert a timestamp to a date string in yyyy-MM-dd hh:mm:ss format, for example, convert 1701312046588 to 2023-11-30 10:40:46.

                                              Expression: DateUtils.format(NumberUtils.toLong(value),"yyyy-MM-dd HH:mm:ss")

                                              +
                                            5. Convert a timestamp to a date string in yyyy-MM-dd hh:mm:ss format, for example, convert 1701312046588 to 2023-11-30 10:40:46.

                                              Expression: DateUtils.format(NumberUtils.toLong(value),"yyyy-MM-dd HH:mm:ss")

                                            6. Convert a date string in the yyyy-MM-dd hh:mm:ss format to a timestamp.

                                              Expression: DateUtils.getTime(DateUtils.parseDate(value,"yyyy-MM-dd hh:mm:ss"))

                                            7. If the field value is a date string in yyyy-MM-dd format, extract the year from the field value, for example, extract 2017 from 2017-12-01.

                                              Expression: StringUtils.substringBefore(value,"-")

                                            8. If the field value is of the numeric type, convert the value to a new value which is two times greater than the original value:

                                              Expression: value*2

                                              @@ -69,12 +71,13 @@
                                            9. If the field is of the string type, remove the substring at the end of the field. If the specified substring is not at the end of the field, no conversion is performed. For example, remove .com at the end of www.domain.com.

                                              Expression: StringUtils.removeEnd(value,".com")

                                            10. If the field is of the string type, delete the substring at the beginning of the field. If the specified substring is not at the beginning of the field, no conversion is performed. For example, delete www. at the beginning of www.domain.com.

                                              Expression: StringUtils.removeStart(value,"www.")

                                            11. If the field is of the string type, replace all the specified character strings in the field. For example, replace a in aba with z to obtain zbz.

                                              Expression: StringUtils.replace(value,"a","z")

                                              +

                                              If the content to be replaced contains a special character, the special character must be escaped to a common character. For example, if you want to delete \t from a string, use the following expression: StringUtils.replace(value,"\\t",""), which means escaping the backslash (\) again.

                                            12. If the field is of the string type, replace multiple characters in the character string at a time. For example, replace h in hello with j and o with y to obtain jelly.

                                              Expression: StringUtils.replaceChars(value,"ho","jy")

                                            13. If the string starts with the specified prefix (case sensitive), true is returned; otherwise, false is returned. For example, abcdef starts with abc, so that true is returned.

                                              Expression: StringUtils.startsWith(value,"abc")

                                            14. If the field is of the string type, delete all the specified characters at the beginning and end of the field. the field. For example, delete all x, y, z, and b from abcyx to obtain abc.

                                              Expression: StringUtils.strip(value,"xyzb")

                                              -
                                            15. If the field is of the string type, delete all the specified characters at the end of the field, for example, delete the abc string at the end of the field.

                                              Expression: StringUtils.stripEnd(value,"abc")

                                              +
                                            16. If the field is of the string type, delete all the specified characters at the end of the field, for example, delete the "abc" string at the end of the field.

                                              Expression: StringUtils.stripEnd(value,"abc")

                                            17. If the field is of the string type, delete all the specified characters at the beginning of the field, for example, delete all spaces at the beginning of the field.

                                              Expression: StringUtils.stripStart(value,null)

                                              -
                                            18. If the field is of the string type, obtain the substring after the specified position (the index starts from 0, including the character at the specified position) of the character string. If the specified position is a negative number, calculate the position in the descending order. The first digit at the end is -1. For example, obtain the second character (c) of abcde and the string after it, that is, cde.

                                              Expression: StringUtils.substring(value,2)

                                              +
                                            19. If the field is of the string type, obtain the substring after the specified position (the index starts from 0, including the character at the specified position) of the character string. If the specified position is a negative number, calculate the position in the descending order. The first digit at the end is -1. For example, obtain the character whose index is 2 from abcde (that is, c) and the string after it, that is, cde.

                                              Expression: StringUtils.substring(value,2)

                                            20. If the field is of the string type, obtain the substring in a specified range (the index starts from 0, including the character at the start and excluding the character at the end). If the range is a negative number, calculate the position in the descending order. The first digit at the end is -1. For example, obtain the string between the second character (c) and fourth character (e) of abcde, that is, cd.

                                              Expression: StringUtils.substring(value,2,4)

                                            21. If the field is of the string type, obtain the substring after the first specified character. For example, obtain the substring after the first b in abcba, that is, cba.

                                              Expression: StringUtils.substringAfter(value,"b")

                                            22. If the field is of the string type, obtain the substring after the last specified character. For example, obtain the substring after the last b in abcba, that is, a.

                                              Expression: StringUtils.substringAfterLast(value,"b")

                                              @@ -94,13 +97,13 @@
                                            23. Convert the character string to a value of the long type. If the conversion fails, the specified value, for example, 1L, is returned.

                                              Expression: NumberUtils.toLong(value,1L)

                                            24. Convert the character string to a value of the short type. If the conversion fails, 0 is returned.

                                              Expression: NumberUtils.toShort(value)

                                            25. Convert the character string to a value of the short type. If the conversion fails, the specified value, for example, 1, is returned.

                                              Expression: NumberUtils.toShort(value,1)

                                              -
                                            26. Convert the IP string to a value of the long type, for example, convert 10.78.124.0 to 172915712.

                                              Expression: CommonUtils.ipToLong(value)

                                              +
                                            27. Convert the IP string to a value of the long type, for example, convert 10.78.124.0 to 172915712.

                                              Expression: CommonUtils.ipToLong(value)

                                            28. Read an IP address and physical address mapping file from the network, and download the mapping file to the map collection. url indicates the address for storing the IP mapping file, for example, http://10.114.205.45:21203/sqoop/IpList.csv.

                                              Expression: HttpsUtils.downloadMap("url")

                                            29. Cache the IP address and physical address mappings and specify a key for retrieval, for example, ipList.

                                              Expression: CommonUtils.setCache("ipList",HttpsUtils.downloadMap("url"))

                                            30. Obtain the cached IP address and physical address mappings.

                                              Expression: CommonUtils.getCache("ipList")

                                            31. Check whether the IP address and physical address mappings are cached.

                                              Expression: CommonUtils.cacheExists("ipList")

                                            32. Based on the specified offset type (month/day/hour/minute/second) and offset (positive number indicates increase and negative number indicates decrease), convert the time in the specified format to a new time, for example, add 8 hours to 2019-05-21 12:00:00.

                                              Expression: DateUtils.getCurrentTimeByZone("yyyy-MM-dd HH:mm:ss",value, "hour", 8)

                                              -
                                            33. If the value is empty or null, "aaa" is returned. Otherwise, value is returned.

                                              Expression: StringUtils.defaultIfEmpty(value,"aaa")

                                              +
                                            34. If the value is empty or null, "aaa" is returned. Otherwise, value is returned.

                                              Expression: StringUtils.defaultIfEmpty(value,"aaa")

                                          @@ -111,3 +114,10 @@
                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0107.html b/docs/dataartsstudio/umn/dataartsstudio_01_0107.html new file mode 100644 index 000000000..67ff117ba --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0107.html @@ -0,0 +1,23 @@ + + +

                                      (Optional) Defining a Workspace Role

                                      +

                                      For IAM users with DARTS User account permissions, DataArts Studio workspace roles determine their permissions in workspaces. Preset roles include admin, developer, deployer, operator, and viewer. For details about the permissions of each role, see "Permissions" in Service Overview.

                                      +

                                      If the preset roles meet your needs, skip this section. Otherwise, create custom roles by following the instructions in this section.

                                      +

                                      Context

                                      • DARTS Administrator or Tenant Administrator can create custom roles in a workspace.
                                      +
                                      +

                                      Notes and Constraints

                                      • Due to the constraints of the authentication cache mechanism, when the permissions of a custom role change, permissions of the members of the workspace that this role has been associated with will not be updated immediately. Instead, the updated permissions take effect six minutes after the workspace members with this role stop accessing the DataArts Studio console.
                                      • A custom role with the same permissions as the workspace admin cannot perform some operations that can only be performed by the admin.
                                      +
                                      +

                                      Procedure

                                      1. Log in to the DataArts Studio console as user DARTS Administrator or Tenant Administrator. For details, see Accessing the DataArts Studio Instance Console.
                                      2. On the Roles page, click Create. In the displayed dialog box, set the following parameters:

                                        • Role Name: unique identifier of a custom role. You are advised to name the role to fit its application scenario and avoid any meaningless description.
                                        • Role Description: description of the role, for example, the key permission differences between the role and preset roles
                                        • Role Type: Select a proper type based on where this role will be used. Role permissions differ in the simple and enterprise mode. For details about the enterprise mode, see DataArts Studio Enterprise Mode Overview.
                                          • If you want to use this role in a workspace in simple mode, select DEV&PROD_CUSTOM.
                                          • If you want to use this role in the development environment of a workspace in enterprise mode, select DEV_CUSTOM.
                                          • If you want to use this role in the production environment of a workspace in enterprise mode, select PROD_CUSTOM.
                                          +
                                        • Reuse: Use this function if you only need to slightly adjust the permissions of the preset roles to meet your requirements. Otherwise, you can directly select permissions for the role.

                                          When you create or edit a role, an error message indicating insufficient permissions may be displayed even if you have the DARTS Administrator or Tenant Administrator permissions. This may be caused by network constraints. You can change another network and try again.

                                          +
                                          +
                                        +

                                        +

                                      3. After configuring the role name, type, and permissions, click OK.
                                      4. Assign the created custom role to the IAM user by following the instructions in Adding Workspace Members and Assigning Roles.
                                      +
                                      +
                                      + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0108.html b/docs/dataartsstudio/umn/dataartsstudio_01_0108.html index 6bd10fdfb..6fc87c3b2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0108.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0108.html @@ -58,15 +58,15 @@
                                    3. Field Delimiter

                                      Character used to separate columns in a CSV file. The value can be a single character, multiple characters, or special characters. For details, see Table 1.

                                    4. Encoding Type

                                      Encoding type of a CSV file. The default value is UTF-8.

                                      If this parameter is specified at the migration source, the specified encoding type is used to parse the file. If this parameter is specified at the migration destination, the specified encoding type is used to write data to the file.

                                      -
                                    5. Use Quote Character
                                      • Exporting data from a database or NoSQL to CSV files (configuring Use Quote Character at the migration destination): If a field delimiter appears in the character string of a column of data at the migration source, set Use Quote Character to Yes at the migration destination to quote the character string as a whole and write it into the CSV file. Currently, CDM uses double quotation marks ("") as the quote character only. Figure 1 shows that the value of the name field in the database contains a comma (,).
                                        Figure 1 Field value containing the field delimiter
                                        +
                                      • Use Quote Character
                                        • Exporting data from a database or NoSQL to CSV files (configuring Use Quote Character at the migration destination): If a field delimiter appears in the character string of a column of data at the migration source, set Use Quote Character to Yes at the migration destination to quote the character string as a whole and write it into the CSV file. Currently, CDM uses double quotation marks ("") as the quote character only. Figure 1 shows that the value of the name field in the database contains a comma (,).
                                          Figure 1 Field value containing the field delimiter

                                          If you do not use the quote character, the exported CSV file is displayed as follows:

                                          -
                                          3.hello,world,abc
                                          +
                                          3,hello,world,abc

                                          If you use the quote character, the exported CSV file is displayed as follows:

                                          3,"hello,world",abc

                                          If the data in the database contains double quotation marks ("") and you set Use Quote Character to Yes, the quote character in the exported CSV file is displayed as three double quotation marks ("""). For example, if the value of a field is a"hello,world"c, the exported data is as follows:

                                          """a"hello,world"c"""
                                          -
                                        • Exporting CSV files to a database or NoSQL (configuring Use Quote Character at the migration source): If you want to import the CSV files with quoted values to a database correctly, set Use Quote Character to Yes at the migration source to write the quoted values as a whole.
                                        -
                                      • Use RE to Separate Fields

                                        This function is used to parse complex semi-structured text, such as log files. For details, see Using Regular Expressions to Separate Semi-structured Text.

                                        +
                                      • Exporting CSV files to a database or NoSQL (configuring Use Quote Character at the migration source): If you want to import the CSV files with quoted values to a database correctly, set Use Quote Character to Yes at the migration source to write the quoted values as a whole.
                                      +
                                    6. Use RE to Separate Fields

                                      This function is used to parse complex semi-structured text, such as log files. For details, see Using Regular Expressions to Separate Semi-structured Text.

                                    7. Use First Row as Header

                                      This parameter is used when CSV files are exported to other locations. If this parameter is specified at the migration source, CDM uses the first row as the header when extracting data. When the CSV files are transferred, the headers are skipped. The number of rows extracted from the migration source is more than the number of rows written to the migration destination. The log files will output the information that the header is skipped during the migration.

                                    8. File Size

                                      This parameter is used when data is exported from the database to a CSV file. If a table contains a large amount of data, a large CSV file is generated after migration, which is inconvenient to download or view. In this case, you can specify this parameter at the migration destination so that multiple CSV files with the specified size can be generated. The value of this parameter is an integer. The unit is MB.

                                    @@ -107,7 +107,7 @@ }]
                                3. JSON Reference Node

                                  Root node that records data. The data corresponding to the node is a JSON array. CDM extracts data from the array in the same mode. Use periods (.) to separate multi-layer nested JSON nodes.

                                  -
                                4. Copying Data from a JSON File
                                  1. Example 1: Extract data from multiple objects that are separated or merged. A JSON file contains multiple JSON objects. The following gives an example:
                                     {
                                    +
                                  2. Copying Data from a JSON File
                                    1. Example 1
                                      Extract data from multiple objects that are separated or merged. A JSON file contains multiple JSON objects. The following gives an example:
                                       {
                                           "took": 190,
                                           "timed_out": false,
                                           "total": 1000001,
                                      @@ -125,49 +125,50 @@
                                           "total": 1000003,
                                           "max_score": 1.0
                                        }
                                      +
                                      To extract data from the JSON object and write data to the database in the following formats, set File Format to JSON and JSON Type to JSON object, and then map fields. -
                              Table 1 MySQL link parameters

                              Parameter

                              Description

                              +

                              Description

                              Example Value

                              +

                              Example Value

                              Name

                              +

                              Name

                              Unique link name

                              +

                              Unique link name

                              mysqllink

                              +

                              mysqllink

                              Database Server

                              +

                              Database Server

                              IP address or domain name of the MySQL database server

                              +

                              IP address or domain name of the MySQL database server

                              -

                              +

                              -

                              Port

                              +

                              Port

                              MySQL database port

                              +

                              MySQL database port

                              3306

                              +

                              3306

                              Database Name

                              +

                              Database Name

                              Name of the MySQL database

                              +

                              Name of the MySQL database

                              sqoop

                              +

                              sqoop

                              Username

                              +

                              Username

                              User who has the read, write, and delete permissions on the MySQL database

                              +

                              User who has the read, write, and delete permissions on the MySQL database

                              admin

                              +

                              admin

                              Password

                              +

                              Password

                              Password of the user

                              +

                              Password of the user

                              -

                              +

                              -

                              Use Local API

                              +

                              Use Local API

                              Whether to use the local API of the database for acceleration. (The system attempts to enable the local_infile system variable of the MySQL database.)

                              +

                              Whether to use the local API of the database for acceleration. (The system attempts to enable the local_infile system variable of the MySQL database.)

                              Yes

                              +

                              Yes

                              Use Agent

                              +

                              Use Agent

                              Whether to extract data from the data source through an agent

                              +

                              The agent function will be unavailable soon and does not need to be configured.

                              No

                              +

                              -

                              local_infile Character Set

                              +

                              local_infile Character Set

                              When using local_infile to import data to MySQL, you can configure the encoding format.

                              +

                              When using local_infile to import data to MySQL, you can configure the encoding format.

                              utf8

                              +

                              utf8

                              Driver Version

                              +

                              Driver Version

                              Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database. Download the MySQL driver 5.1.48 from https://downloads.mysql.com/archives/c-j/, obtain mysql-connector-java-5.1.48.jar, and upload it.

                              +

                              Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database. Download the MySQL driver 5.1.48 from https://downloads.mysql.com/archives/c-j/, obtain mysql-connector-java-5.1.48.jar, and upload it.

                              -

                              +

                              -

                              Use Agent

                              Whether to extract data from the data source through an agent

                              +

                              The agent function will be unavailable soon and does not need to be configured.

                              Yes

                              +

                              -

                              Agent

                              Click Select and select the created agent.

                              +

                              The agent function will be unavailable soon and does not need to be configured.

                              -

                              - @@ -34,9 +37,12 @@ @@ -60,7 +66,12 @@ - - - - - + + + @@ -125,6 +143,20 @@ + + + + + +

                              took

                              +
                              - - - - - - - - - - - - - - -
                              Table 2 Example

                              took

                              timedOut

                              +

                              timedOut

                              total

                              +

                              total

                              maxScore

                              +

                              maxScore

                              190

                              +

                              190

                              false

                              +

                              false

                              1000001

                              +

                              1000001

                              1.0

                              +

                              1.0

                              191

                              +

                              191

                              false

                              +

                              false

                              1000002

                              +

                              1000002

                              1.0

                              +

                              1.0

                              192

                              +

                              192

                              false

                              +

                              false

                              1000003

                              +

                              1000003

                              1.0

                              +

                              1.0

                              -
                            5. Example 2: Extract data from the reference node. A JSON file contains a single JSON object, but the valid data is on a data node. The following gives an example:
                              {
                              +
                            6. Example 2
                              Extract data from the reference node. A JSON file contains a single JSON object, but the valid data is on a data node. The following gives an example:
                              {
                                   "took": 190,
                                   "timed_out": false,
                                   "hits": {
                              @@ -197,41 +198,42 @@
                                        }]
                                    }
                                }
                              +
                              To write data to the database in the following formats, set File Format to JSON, JSON Type to JSON object, and JSON Reference Node to hits.hits, and then map fields. -
                              @@ -92,7 +92,7 @@ + + + +

                              ID

                              +
                              - - - - - - - - - - -
                              Table 3 Example

                              ID

                              SourceName

                              +

                              SourceName

                              SourceBooks

                              +

                              SourceBooks

                              650612

                              +

                              650612

                              tom

                              +

                              tom

                              ["book1","book2","book3"]

                              +

                              ["book1","book2","book3"]

                              650616

                              +

                              650616

                              tom

                              +

                              tom

                              ["book1","book2","book3"]

                              +

                              ["book1","book2","book3"]

                              650618

                              +

                              650618

                              tom

                              +

                              tom

                              ["book1","book2","book3"]

                              +

                              ["book1","book2","book3"]

                              -
                            7. Example 3: Extract data from the JSON array. A JSON file is a JSON array consisting of multiple JSON objects. The following gives an example:
                              [{
                              +
                            8. Example 3
                              Extract data from the JSON array. A JSON file is a JSON array consisting of multiple JSON objects. The following gives an example:
                              [{
                                     "took" : 190,
                                     "timed_out" : false,
                                     "total" : 1000001,
                              @@ -243,83 +245,85 @@
                                     "total" : 1000002,
                                     "max_score" : 1.0
                                 }]
                              +

                              To write data to the database in the following formats, set File Format to JSON and JSON Type to JSON array, and then map fields.

                              -
                              + + + +

                              took

                              +
                              - - - - - - - - - - -
                              Table 4 Example

                              took

                              timedOut

                              +

                              timedOut

                              total

                              +

                              total

                              maxScore

                              +

                              maxScore

                              190

                              +

                              190

                              false

                              +

                              false

                              1000001

                              +

                              1000001

                              1.0

                              +

                              1.0

                              191

                              +

                              191

                              false

                              +

                              false

                              1000002

                              +

                              1000002

                              1.0

                              +

                              1.0

                              -
                            9. Example 4: Configure a converter when parsing the JSON file. On the premise of example 2, to add the hits.max_score field to all records, that is, to write the data to the database in the following formats, perform the following operations: -
                              - - - - - - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0465.html b/docs/dataartsstudio/umn/dataartsstudio_01_0465.html index e02a53826..d559677ff 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0465.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0465.html @@ -1,7 +1,7 @@

                              Open/Close Resource

                              -

                              Functions

                              You can use the Open/Close Resource node to enable or disable cloud services as required.

                              +

                              Functions

                              You can use the Open/Close Resource node to enable or disable services as required.

                              Parameters

                              Table 1 and Table 2 describe the parameters of the Open/Close Resource node.

                              @@ -97,6 +97,13 @@
                              + + + +

                              ID

                              +
                            10. Example 4
                              Configure a converter when parsing the JSON file. On the premise of example 2, to add the hits.max_score field to all records, that is, to write the data to the database in the following formats, perform the following operations: +
                              - - - - - - - - - - - - - - -
                              Table 5 Example

                              ID

                              SourceName

                              +

                              SourceName

                              SourceBooks

                              +

                              SourceBooks

                              MaxScore

                              +

                              MaxScore

                              650612

                              +

                              650612

                              tom

                              +

                              tom

                              ["book1","book2","book3"]

                              +

                              ["book1","book2","book3"]

                              1.0

                              +

                              1.0

                              650616

                              +

                              650616

                              tom

                              +

                              tom

                              ["book1","book2","book3"]

                              +

                              ["book1","book2","book3"]

                              1.0

                              +

                              1.0

                              650618

                              +

                              650618

                              tom

                              +

                              tom

                              ["book1","book2","book3"]

                              +

                              ["book1","book2","book3"]

                              1.0

                              +

                              1.0

                              -
                              Set File Format to JSON, JSON Type to JSON object, and JSON Reference Node to hits.hits, and then create a converter.
                              1. Click to add a field.
                                Figure 2 Adding a field
                                -
                              2. Click to create a converter for the new field.
                                Figure 3 Creating a field converter
                                -
                              3. Set Converter to Expression conversion, enter "1.0" in the Expression text box, and click Save.
                                Figure 4 Configuring a field converter
                                +
                              +
                              Set File Format to JSON, JSON Type to JSON object, and JSON Reference Node to hits.hits, and then create a converter.
                              1. Click to add a field.
                                Figure 2 Adding a field
                                +
                              2. Click to create a converter for the new field.
                                Figure 3 Creating a field converter
                                +
                              3. Set Converter to Expression conversion, enter "1.0" in the Expression text box, and click Save.
                                Figure 4 Configuring a field converter
                            11. @@ -337,19 +341,18 @@

                              In addition, you can set the suspension period. Within the suspension period, CDM periodically queries whether the marker file exists. If the file does not exist after the suspension period expires, the job fails.

                              The marker file will not be migrated.

                            12. Job Success Marker File

                              After data is successfully migrated to a file system, an empty file is generated in the destination directory. You can specify the file name. Generally, this parameter is used together with Start Job by Marker File.

                              -

                              Note that the file cannot be confused with the file to be transferred. For example, if the file to be transferred is finish.txt and the job success marker file is set to finish.txt, the two files will overwrite each other.

                              +

                              The name of the job success marker file cannot be the same as that of the transferred file, for example, finish.txt. If the two files have the same name, they will overwrite each other.

                            13. Filter

                              When using CDM to migrate files, you can specify a filter to filter files. Files can be filtered by wildcard character or time filter.

                              • If you select Wildcard, CDM migrates only the paths or files that meet the filter condition.
                              • If you select Time Filter, CDM migrates only the files modified after the specified time point.
                              -

                              For example, the /table/ directory stores a large number of data table directories divided by day. DRIVING_BEHAVIOR_20180101 to DRIVING_BEHAVIOR_20180630 store all data of DRIVING_BEHAVIOR from January to June. To migrate only the table data of DRIVING_BEHAVIOR in March, set Source Directory/File to /table, Filter Type to Wildcard, and Path Filter to DRIVING_BEHAVIOR_201803*.

                              +

                              For example, the /table/ directory stores a large number of data table directories divided by day. DRIVING_BEHAVIOR_20180101 to DRIVING_BEHAVIOR_20180630 store all data of DRIVING_BEHAVIOR from January to June. If you only want to migrate the table data of DRIVING_BEHAVIOR in March, set the source directory to /table, filter type to wildcard, and path filter to DRIVING_BEHAVIOR_201803*.

                            14. Solutions to File Format Problems

                              1. When data in a database is exported to a CSV file, if the data contains commas (,), the data in the exported CSV file is disordered.

                                The following solutions are available:

                                -
                                1. Specify a field delimiter.

                                  Use a character that does not exist in the database or a rare non-printable character as the field delimiter. For example, set Field Delimiter at the migration destination to %01. In this way, the exported field delimiter is \u0001. For details, see Table 1.

                                  -
                                2. Use the quote character.

                                  Set Use Quote Character to Yes at the migration destination. In this way, if the field in the database contains the field delimiter, CDM quotes the field using the quote character and write the field as a whole to the CSV file.

                                  -
                                -
                              2. The data in the database contains line separators.

                                Scenario: When you use CDM to export a table in the MySQL database (a field value contains the line separator \n) to a CSV file, and then use CDM to import the exported CSV file to MRS HBase, data in the exported CSV file is truncated.

                                -

                                Solution: Specify a line separator.

                                -

                                When you use CDM to export MySQL table data to a CSV file, set Line Separator at the migration destination to %01 (ensure that the value does not appear in the field value). In this way, the line separator in the exported CSV file is %01. Then use CDM to import the CSV file to MRS HBase. Set Line Separator at the migration source to %01. This avoids data truncation.

                                +
                                • Specify a field delimiter.

                                  Use a character that does not exist in the database or a rare non-printable character as the field delimiter. For example, you can set Field Delimiter at the destination to %01. In this way, the exported field delimiter is \u0001. For details, see Table 1.

                                  +
                                • Use a quote character.

                                  Set Use Quote Character to Yes at the migration destination. In this way, if the field in the database contains the field delimiter, CDM quotes the field using the quote character and write the field as a whole to the CSV file.

                                  +
                                +
                              3. The data in the database contains line separators.
                                • Scenario: When you use CDM to export a table in the MySQL database (a field value contains the line separator \n) to a CSV file, and then use CDM to import the exported CSV file to MRS HBase, data in the exported CSV file is truncated.
                                • Solution: Specify a line separator.

                                  When you use CDM to export MySQL table data to a CSV file, set Line Separator at the migration destination to %01 (ensure that the value does not appear in the field value). In this way, the line separator in the exported CSV file is %01. Then use CDM to import the CSV file to MRS HBase. Set Line Separator at the migration source to %01. This avoids data truncation.

                                  +
                              @@ -359,3 +362,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0109.html b/docs/dataartsstudio/umn/dataartsstudio_01_0109.html index b9eaba701..80ba9c77f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0109.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0109.html @@ -4,9 +4,9 @@

                              When you create a job on the CDM console to migrate tables or files of a relational database, you can add a field to record the time when they were written to the database.

                              Prerequisites

                              • A link has been created, and the source end of the connector is a relational database.
                              • The destination data table contains a date and time field or timestamp field. In the automatic table creation scenario, you need to manually create the date and time field or timestamp field in the destination table in advance.
                              -

                              Creating a Table/File Migration Job

                              1. Create a table/file migration job, and select the created source connector and destination connector.
                              2. Click Next to go to the Map Field page and click .

                                Figure 1 Configuring field mapping
                                +

                                Creating a Table/File Migration Job

                                1. Create a table/file migration job, and select the created source connector and destination connector.
                                2. Click Next to go to the Map Field page and click .

                                  Figure 1 Configuring field mapping

                                3. Click the Custom Fields tab, set the field name and value, and click OK.

                                  Name: Enter InputTime.

                                  -
                                  Value: Enter ${timestamp()}. For more time macro variables, see Table 1.
                                  Figure 2 Add Field
                                  +
                                  Value: Enter ${timestamp()}. For more time macro variables, see Table 1.
                                  Figure 2 Add Field
                                  @@ -44,6 +44,36 @@ + + + + + + + + + + + + + + + + + + + +
                                  Table 1 Macro variable definition of time and date

                                  Macro Variable

                                  2017-10-15 09:00:00

                                  ${dateformat(yyyy-MM-dd, -1, DAY)} 00:00:00

                                  +

                                  Returns 00:00:00 of the day before the current day in yyyy-MM-dd HH:mm:ss format.

                                  +

                                  2017-10-15 00:00:00

                                  +

                                  ${dateformat(yyyy-MM-dd, -1, DAY)} 12:00:00

                                  +

                                  Returns 12:00:00 of the day before the current day in yyyy-MM-dd HH:mm:ss format.

                                  +

                                  2017-10-15 12:00:00

                                  +

                                  ${dateformat(yyyy-MM-dd, -N, DAY)} 00:00:00

                                  +

                                  Returns 00:00:00 of the day N days before the current day in yyyy-MM-dd HH:mm:ss format.

                                  +

                                  When N is 3:

                                  +

                                  2017-10-13 00:00:00

                                  +

                                  ${dateformat(yyyy-MM-dd, -N, DAY)} 12:00:00

                                  +

                                  Returns 12:00:00 of the day N days before the current day in yyyy-MM-dd HH:mm:ss format.

                                  +

                                  When N is 3:

                                  +

                                  2017-10-13 12:00:00

                                  +

                                  ${timestamp()}

                                  Returns the timestamp of the current time, that is, the number of milliseconds that have elapsed since 00:00:00 on January 1, 1970.

                                  @@ -95,3 +125,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0110.html b/docs/dataartsstudio/umn/dataartsstudio_01_0110.html index 4a86aa09e..1952b5395 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0110.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0110.html @@ -6,21 +6,19 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0111.html b/docs/dataartsstudio/umn/dataartsstudio_01_0111.html index c05de40f5..0e5a3efb2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0111.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0111.html @@ -8,7 +8,7 @@ - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0112.html b/docs/dataartsstudio/umn/dataartsstudio_01_0112.html index 9136eec99..bcfbcea7a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0112.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0112.html @@ -6,7 +6,7 @@
                                  1. Exporting the files in a specified directory
                                    • Application scenarios: The migration source is a file system (OBS/HDFS/FTP/SFTP). In incremental migration, only the specified files are written to the migration destination. The existing records are not updated or deleted.
                                    • Key configurations: File/Path Filter and Schedule Execution
                                    • Prerequisites: The source directory or file name contains the time field.
                                  2. Exporting the files modified after the specified time point
                                    • Application scenarios: The migration source is a file system (OBS/HDFS/FTP/SFTP). The specified time point refers to the time when the file is modified. CDM migrates the files modified at or after the specified time point.
                                    • Key configurations: Time Filter and Schedule Execution
                                    • Prerequisites: None
                                  -

                                  If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                  +

                                  If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                  File/Path Filter

                                  • Parameter position: When creating a table/file migration job, if the migration source is a file system, set Filter Type in advanced attributes of Source Job Configuration to Wildcard or Regular expression.
                                  • Parameter principle: If you select Wildcard for Filter Type, CDM filters files or paths based on the configured wildcard character and migrates only files or paths that meet the specified condition.
                                  • Example configurations:
                                    Suppose that the source file name contains the date and time field, such as 2017-10-15 20:25:26, the /opt/data/file_20171015202526.data file is generated. Set the parameters as follows:
                                    1. Filter Type: Select Wildcard.
                                    2. File Filter: Enter "*${dateformat(yyyyMMdd,-1,DAY)}*", which is the format of the macro variables of date and time supported by CDM. For details, see Using Macro Variables of Date and Time.
                                    3. Schedule Execution: Set Cycle (days) to 1.
                                    @@ -14,7 +14,7 @@

                                    In this way, you can import the files generated in the previous day to the destination directory every day to implement incremental synchronization.

                                    In incremental file migration, Path Filter is used in the same way as File Filter. The path name must contain the time field. In this case, all files in the specified path can be synchronized periodically.

                                  -

                                  Time Filter

                                  • Parameter position: When creating a table/file migration job, if the migration source is a file system, set select Yes for Time Filter.
                                  • Parameter principle: After you specify the start time and end time, only files that are modified between the start time (included) and end time (excluded) will be migrated.
                                  • Example configurations:
                                    For example, if you want CDM to synchronize only the files generated from January 1, 2021 to January 1, 2022 to the destination, configure the following parameters:
                                    1. Time Filter: select Yes.
                                    2. Minimum Timestamp: Enter a value in the format of yyyy-MM-dd HH:mm:ss, such as 2021-01-01 00:00:00.
                                    3. Maximum Timestamp: Enter a value in the format of yyyy-MM-dd HH:mm:ss, such as 2022-01-01 00:00:00.
                                    +

                                    Time Filter

                                    • Parameter position: When creating a table/file migration job, if the migration source is a file system, set select Yes for Time Filter.
                                    • Parameter principle: After you specify the start time and end time, only files that are modified between the start time (included) and end time (excluded) will be migrated.
                                    • Example configurations:
                                      For example, if you want CDM to synchronize only the files generated from January 1, 2021 to January 1, 2022 to the destination, configure the following parameters:
                                      1. Time Filter: select Yes.
                                      2. Minimum Timestamp: Enter a value in the format of yyyy-MM-dd HH:mm:ss, such as 2021-01-01 00:00:00.
                                      3. Maximum Timestamp: Enter a value in the format of yyyy-MM-dd HH:mm:ss, such as 2022-01-01 00:00:00.

                                    In this way, the CDM job migrates only the files generated from January 1, 2021 to January 1, 2022, and performs incremental synchronization next time it is started.

                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0113.html b/docs/dataartsstudio/umn/dataartsstudio_01_0113.html index 129734692..05cbcef69 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0113.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0113.html @@ -5,11 +5,11 @@
                                    • Migrating incremental data within a specified period of time
                                      • Application scenarios: The source end is a relational database. The destination end can be of any type.
                                      • Key configurations: WHERE Clause and Schedule Execution
                                      • Prerequisites: The data table contains a date and time field or timestamp field.

                                    In incremental migration, only the specified data is written to the data table. The existing records are not updated or deleted.

                                    -

                                    If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                    +

                                    If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                    WHERE Clause

                                    • Parameter position: When creating a table/file migration job, if the source end is a relational database, the Where Clause parameter is available in the advanced attributes of Source Job Configuration.
                                    • Parameter principle: Set WHERE Clause to an SQL statement, for example, age > 18 and age <= 60, CDM exports only the data that meets the SQL statement requirement. If WHERE Clause is not specified, the entire table is exported.

                                      Where Clause can be set to macro variables of date and time. When the data table contains the date or timestamp field, Where Clause and Schedule Execution can be used together to extract data of a specified date.

                                    • Example configurations:

                                      Suppose that the database table contains column DS indicating the time, the value type of the column is varchar(30), and the inserted time format is similar to 2017-xx-xx. See Figure 1. Set the parameters as follows:

                                      -
                                      Figure 1 Table data
                                      +
                                      Figure 1 Table data
                                      1. WHERE Clause: Set this parameter to DS='${dateformat(yyyy-MM-dd,-1,DAY)}'.
                                      2. Scheduling job execution: Set Cycle (days) to 1 and Start Time to 00:00:00.

                                      In this way, all data generated on the previous day can be exported at 00:00:00 every day. WHERE Clause can be configured to various macro variables of date and time. You can use the macro variables of date and time and scheduled jobs with specified cycle of minutes, hours, days, weeks, or months together to automatically export data at a specific time.

                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0114.html b/docs/dataartsstudio/umn/dataartsstudio_01_0114.html index fba57e23a..89ee8d956 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0114.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0114.html @@ -5,18 +5,18 @@

                                    You can use the ${} macro variable definition identifier to define the macros of the time type. currently, dateformat and timestamp are supported.

                                    By using the macro variables of date and time and scheduled job, you can implement incremental synchronization of databases and files.

                                    -

                                    If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                    +

                                    If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                    dateformat

                                    dateformat supports two types of parameters:

                                    -
                                    • dateformat(format)

                                      format indicates the date and time format. For details about the format definition, see the definition in java.text.SimpleDateFormat.java.

                                      -

                                      For example, if the current date is 2017-10-16 09:00:00, yyyy-MM-dd HH:mm:ss indicates 2017-10-16 09:00:00.

                                      +
                                      • dateformat(format)

                                        format indicates the date and time format. For details about the format definition, see the definition in java.text.SimpleDateFormat.java.

                                        +

                                        For example, if the current date is 2017-10-16 09:00:00, yyyy-MM-dd HH:mm:ss indicates 2017-10-16 09:00:00.

                                      • dateformat(format, dateOffset, dateType)
                                        • format indicates the format of the returned date.
                                        • dateOffset indicates the date offset.
                                        • dateType indicates the type of the date offset.

                                          Currently, dateType supports SECOND, MINUTE, HOUR, MONTH, YEAR, and DAY.

                                          Pay attention to the following special scenarios of MONTH and YEAR:

                                          • If the date does not exist after the offset, the latest date of the month in the calendar is used.
                                          • These two offset types cannot be used for the start time and end time in the Time Filter parameter of the source and destination jobs.
                                        -

                                        For example, if the current date is 2023-03-01 09:00:00, then:

                                        -
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, YEAR) indicates the year before the current time, that is, 2022-03-01 09:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -3, MONTH) indicates three months before the current time, that is, 2022-12-01 09:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY) indicates the day before the current time, that is, 2023-02-28 09:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, HOUR) indicates one hour before the current time, that is, 2023-03-01 08:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, MINUTE) indicates one minute before the current time, that is, 2023-03-01 08:59:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, SECOND) indicates one second before the current time, that is, 2023-03-01 08:59:59.
                                        +

                                        For example, if the current date is 2023-03-01 09:00:00, then:

                                        +
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, YEAR) indicates the year before the current time, that is, 2022-03-01 09:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -3, MONTH) indicates three months before the current time, that is, 2022-12-01 09:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY) indicates the day before the current time, that is, 2023-02-28 09:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, HOUR) indicates one hour before the current time, that is, 2023-03-01 08:00:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, MINUTE) indicates one minute before the current time, that is, 2023-03-01 08:59:00.
                                        • dateformat(yyyy-MM-dd HH:mm:ss, -1, SECOND) indicates one second before the current time, that is, 2023-03-01 08:59:59.

                                    timestamp

                                    timestamp supports two types of parameters:

                                    @@ -26,76 +26,108 @@

                                  Macro Variable Definition of Time and Date

                                  Suppose that the current time is 2017-10-16 09:00:00, then Table 1 describes the macro variable definitions of time and date.

                                  +

                                  The examples in the table must be embedded in ''. For example, '${dateformat(yyyy-MM-dd)}' returns the current time in yyyy-MM-dd format.

                                  +
                                  -
                                  + + + +
                                  Table 1 Macro variable definition of time and date

                                  Macro Variable

                                  +
                                  - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + @@ -105,11 +137,11 @@

                                  Time and Date Macro Variables of Paths and Table Names

                                  Figure 1 shows an example. If:
                                  • Table Name under Source Link Configuration is set to CDM_/${dateformat(yyyy-MM-dd)}.
                                  • Write Directory under Destination Link Configuration is set to /opt/ttxx/${timestamp()}.

                                  After the macro definition conversion, this job indicates that data in table SQOOP.CDM_20171016 in the Oracle database is migrated to the /opt/ttxx/1508115701746 directory of the HDFS server.

                                  -
                                  Figure 1 Setting Table Name and Write Directory to a time and date macro variable
                                  +
                                  Figure 1 Setting Table Name and Write Directory to a time and date macro variable

                                  Currently, a table name or path name can contain multiple macro variables. For example, /opt/ttxx/${dateformat(yyyy-MM-dd)}/${timestamp()} is converted to /opt/ttxx/2017-10-16/1508115701746.

                                  Time and Date Macro Variables in the Where Clause

                                  Figure 2 uses table SQOOP.CDM_20171016 as an example. The table contains column DS, which indicates the time.

                                  -
                                  Figure 2 Table data
                                  +
                                  Figure 2 Table data

                                  Suppose that the current date is 2017-10-16 and you want to export data generated the day before the current day (DS = 2017-10-15), then you can set the value of Where Clause to DS='${dateformat(yyyy-MM-dd,-1,DAY)}' when creating a job. In this way, you can export all data that complies with the DS = 2017-10-15 condition.

                                  Implementing Incremental Synchronization by Configuring the Macro Variables of Date and Time and Scheduled Jobs

                                  Two simple application scenarios are as follows:

                                  @@ -121,7 +153,14 @@
                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0115.html b/docs/dataartsstudio/umn/dataartsstudio_01_0115.html index b555875a6..f3366a254 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0115.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0115.html @@ -1,18 +1,19 @@ -

                                  Creating a DataArts Studio Basic Package

                                  -

                                  Background

                                  • Only users who have the DARTS Administrator or Tenant Administrator permissions can create DataArts Studio instances or DataArts Studio incremental packages. To allow users to create instances or incremental packages, you must grant the required permissions to them.

                                    Users with the Tenant Administrator permissions can perform all operations except IAM user management. For security purposes, you are not advised to grant the Tenant Administrator permissions to IAM users.

                                    +

                                    Creating a DataArts Studio Instance

                                    +

                                    Context

                                    • Only users with DARTS Administrator or Tenant Administrator permissions can create DataArts Studio instances or incremental packages.

                                      Users with Tenant Administrator permissions can perform all operations except IAM user management. For security purposes, you are not advised to grant Tenant Administrator permissions to IAM users.

                                      -
                                    • Only users who have the Security Administrator permissions can create cloud service agencies. Cloud service agencies allow DataArts Studio to perform operations such as task scheduling and resource O&M on cloud services on your behalf.
                                    +
                                  • Only users with Security Administrator permissions can create cloud service agencies. Cloud service agencies allow DataArts Studio to perform operations such as task scheduling and resource O&M on other cloud services on your behalf.

                                    +

                                  Prerequisites

                                  You have obtained a VPC, subnet, and security group. You can also apply for them when you create a DataArts Studio instance.

                                  -

                                  Logging In to DataArts Studio Console

                                  1. Log in to the cloud console.
                                  2. In the upper left corner of the console, click , and choose DataArts Studio to access the DataArts Studio console.
                                  +

                                  Logging In to the DataArts Studio Console

                                  1. Log in to the cloud console.
                                  2. In the upper left corner of the console, click , and choose to access the DataArts Studio console.
                                  -

                                  Creating a DataArts Studio Basic Package

                                  1. On the DataArts Studio console, click Create Instance.
                                  2. On the displayed page, set parameters for the DataArts Studio instance. Table 1 provides descriptions of the parameters.

                                    +

                                    create a DataArts Studio Basic Package

                                    1. On the DataArts Studio console, click create Instance.
                                    2. On the displayed page, set the parameters listed in Table 1.

                                  Table 1 Macro variable definition of time and date

                                  Macro Variable

                                  Description

                                  +

                                  Description

                                  Display Effect

                                  +

                                  Display Effect

                                  ${dateformat(yyyy-MM-dd)}

                                  +

                                  ${dateformat(yyyy-MM-dd)}

                                  Returns the current date in yyyy-MM-dd format.

                                  +

                                  Returns the current date in yyyy-MM-dd format.

                                  2017-10-16

                                  +

                                  2017-10-16

                                  ${dateformat(yyyy/MM/dd)}

                                  +

                                  ${dateformat(yyyy/MM/dd)}

                                  Returns the current date in yyyy/MM/dd format.

                                  +

                                  Returns the current date in yyyy/MM/dd format.

                                  2017/10/16

                                  +

                                  2017/10/16

                                  ${dateformat(yyyy_MM_dd HH:mm:ss)}

                                  +

                                  ${dateformat(yyyy_MM_dd HH:mm:ss)}

                                  Returns the current time in yyyy_MM_dd HH:mm:ss format.

                                  +

                                  Returns the current time in yyyy_MM_dd HH:mm:ss format.

                                  2017_10_16 09:00:00

                                  +

                                  2017_10_16 09:00:00

                                  ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}

                                  +

                                  ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}

                                  Returns the current time in yyyy-MM-dd HH:mm:ss format. The date is one day before the current day.

                                  +

                                  Returns the current time in yyyy-MM-dd HH:mm:ss format. The date is one day before the current day.

                                  2017-10-15 09:00:00

                                  +

                                  2017-10-15 09:00:00

                                  ${timestamp()}

                                  +

                                  ${dateformat(yyyy-MM-dd, -1, DAY)} 00:00:00

                                  Returns the timestamp of the current time, that is, the number of milliseconds that have elapsed since 00:00:00 on January 1, 1970.

                                  +

                                  Returns 00:00:00 of the day before the current day in yyyy-MM-dd HH:mm:ss format.

                                  1508115600000

                                  +

                                  2017-10-15 00:00:00

                                  ${timestamp(-10, MINUTE)}

                                  +

                                  ${dateformat(yyyy-MM-dd, -1, DAY)} 12:00:00

                                  Returns the timestamp generated 10 minutes before the current time point.

                                  +

                                  Returns 12:00:00 of the day before the current day in yyyy-MM-dd HH:mm:ss format.

                                  1508115000000

                                  +

                                  2017-10-15 12:00:00

                                  ${timestamp(dateformat(yyyyMMdd))}

                                  +

                                  ${dateformat(yyyy-MM-dd, -N, DAY)} 00:00:00

                                  Returns the timestamp of 00:00:00 of the current day.

                                  +

                                  Returns 00:00:00 of the day N days before the current day in yyyy-MM-dd HH:mm:ss format.

                                  1508083200000

                                  +

                                  When N is 3:

                                  +

                                  2017-10-13 00:00:00

                                  ${timestamp(dateformat(yyyyMMdd,-1,DAY))}

                                  +

                                  ${dateformat(yyyy-MM-dd, -N, DAY)} 12:00:00

                                  Returns the timestamp of 00:00:00 of the previous day.

                                  +

                                  Returns 12:00:00 of the day N days before the current day in yyyy-MM-dd HH:mm:ss format.

                                  1507996800000

                                  +

                                  When N is 3:

                                  +

                                  2017-10-13 12:00:00

                                  ${timestamp(dateformat(yyyyMMddHH))}

                                  +

                                  ${timestamp()}

                                  Returns the timestamp of the current hour.

                                  +

                                  Returns the timestamp of the current time, that is, the number of milliseconds that have elapsed since 00:00:00 on January 1, 1970.

                                  1508115600000

                                  +

                                  1508115600000

                                  +

                                  ${timestamp(-10, MINUTE)}

                                  +

                                  Returns the timestamp generated 10 minutes before the current time point.

                                  +

                                  1508115000000

                                  +

                                  ${timestamp(dateformat(yyyyMMdd))}

                                  +

                                  Returns the timestamp of 00:00:00 of the current day.

                                  +

                                  1508083200000

                                  +

                                  ${timestamp(dateformat(yyyyMMdd,-1,DAY))}

                                  +

                                  Returns the timestamp of 00:00:00 of the previous day.

                                  +

                                  1507996800000

                                  +

                                  ${timestamp(dateformat(yyyyMMddHH))}

                                  +

                                  Returns the timestamp of the current hour.

                                  +

                                  1508115600000

                                  - @@ -20,9 +21,9 @@ - - @@ -38,23 +41,23 @@ -
                                  Table 1 DataArts Studio instance parameters

                                  Parameter

                                  Example

                                  +

                                  Example Value

                                  Description

                                  Region

                                  None

                                  +

                                  N/A

                                  The region where the instance resides. Resources in different regions cannot communicate with each other.

                                  +

                                  Region where the instance resides. Resources in different regions cannot communicate with each other.

                                  Enterprise Project

                                  @@ -30,7 +31,9 @@

                                  default

                                  Enterprise project associated with the default workspace of the DataArts Studio instance.

                                  -
                                  This parameter is available only when an enterprise project has been created. If you want to connect the DataArts Studio instance to a cloud service (such as DWS, MRS, and RDS), ensure that the enterprise project of the DataArts Studio workspace is the same as that of the cloud service instance.
                                  • You can create only one DataArts Studio instance for an enterprise project.
                                  • If you want to enable communication between DataArts Studio and another cloud service, ensure that the enterprise project of DataArts Studio is the same as that of the cloud service.
                                  +
                                  This parameter is available only when an enterprise project has been created. If you want to connect the DataArts Studio instance to an instance of another cloud service, such as GaussDB(DWS), MRS, and RDS, ensure that the enterprise project of the DataArts Studio instance's workspace is the same as that of the target cloud service instance.
                                  • You can create only one DataArts Studio instance for an enterprise project.
                                  • If you want to enable communication between DataArts Studio and another cloud service, ensure that the enterprise project of DataArts Studio is the same as that of the target cloud service.
                                  +
                                  NOTE:

                                  If the enterprise project function is not enabled, only one DataArts Studio instance can be created for each IAM project.

                                  +

                                  DataArts Studio-test

                                  Name of the DataArts Studio instance The instance name cannot be changed.

                                  +

                                  Name of the DataArts Studio instance. After the instance is created, its name cannot be changed.

                                  -

                                4. Confirm the settings and click create Now.
                                5. When you return to the DataArts Studio management console, the Authorize Access dialog box is displayed, prompting you to authorize the listed services. DataArts Studio interacts with the cloud services and needs to collaborate with them. Therefore, you need to create a cloud service agency to delegate permissions to DataArts Studio so that DataArts Studio can use these cloud services and perform task scheduling and resource O&M on behalf of you.

                                  Only users who have the Security Administrator permissions can create cloud service agencies. Cloud service agencies allow DataArts Studio to perform operations such as task scheduling and resource O&M on cloud services on your behalf.

                                  +

                                6. Confirm the settings and click create Now.
                                7. When you return to the DataArts Studio console, the Authorize Access dialog box is displayed, prompting you to authorize the listed services. DataArts Studio interacts with these cloud services. You must create a cloud service agency to delegate permissions to DataArts Studio so that DataArts Studio can use these cloud services and perform task scheduling and resource O&M on your behalf.

                                  Only users with Security Administrator permissions can create cloud service agencies. Cloud service agencies allow DataArts Studio to perform operations such as task scheduling and resource O&M on other cloud services on your behalf.

                                  Cloud service agencies include permissions related to DWS, MRS, RDS, OBS, SMN, and KMS. You can access the IAM agency page to view the agency scope. You do not need to apply for an agency for users. The agency of the account is used.

                                  -
                                  Select all services and click Authorize. The platform automatically creates the default agency dlg_agency.
                                  • After the authorization is complete, the Authorize Access dialog box will not be displayed when you access the DataArts Studio console homepage next time.
                                  • If you select only some services for authorization, the system still displays the dialog box next time you access the DataArts Studio console homepage, prompting you to authorize access to unauthorized cloud services.
                                  +
                                  Select all services and click Authorize. The system automatically creates the default dlg_agency.
                                  • After the authorization is complete, the Authorize Access dialog box will not be displayed when you access the DataArts Studio console homepage next time.
                                  • If you select only some services for authorization, this dialog box will be displayed again next time you access the DataArts Studio console, prompting you to authorize access to the unauthorized cloud services.
                                  -

                                8. In the list of instances, locate your instance and click Access to access the DataArts Studio console.
                                9. +

                                10. In the list of instances, locate your instance and click Access to access the DataArts Studio console.
                                11. diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0115_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0115_0.html deleted file mode 100644 index 0e3f090a2..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0115_0.html +++ /dev/null @@ -1,19 +0,0 @@ - - -

                                  HBase/CloudTable Incremental Migration

                                  -

                                  You can use CDM to export data in a specified period of time from HBase (including MRS HBase, FusionInsight HBase, and Apache HBase) and CloudTable. The CDM scheduled jobs can be used together to implement incremental migration of HBase and CloudTable.

                                  -

                                  If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                  -
                                  -

                                  When creating a table/file migration job and selecting the link to HBase or CloudTable as the source link, you can set the time range in advanced attributes.

                                  -
                                  Figure 1 Time range
                                  -
                                  • Start time (including the value) for extracting data. The format is yyyy-MM-dd HH:mm:ss. Only the data generated at the specified time and later is extracted.
                                  • End time (excluding the value) for extracting data. The format is yyyy-MM-dd HH:mm:ss. Only the data generated before the time point is extracted.
                                  -

                                  The two parameters can be set to macro variables of date and time. Examples are as follows:

                                  -
                                  • If Minimum Timestamp is set to ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}, only the data generated after the day before is exported.
                                  • If Maximum Timestamp is set to ${dateformat(yyyy-MM-dd HH:mm:ss)}, only the data generated before the specified time point is exported.
                                  -

                                  If both parameters are configured, CDM exports only the data generated on the previous day. In addition, if the job is configured to execute at 00:00:00 every day, the data generated every day can be incrementally synchronized.

                                  -
                                  -
                                  - -
                                  - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0116.html b/docs/dataartsstudio/umn/dataartsstudio_01_0116.html index 4c84b90a8..f4851ce33 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0116.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0116.html @@ -1,81 +1,94 @@ -

                                  Creating and Managing a Workspace

                                  -

                                  The system will create a default workspace and assign the admin role to you after you create a DataArts Studio instance. can use the default workspace or create a new workspace.

                                  +

                                  Creating a Workspace in Simple Mode

                                  +

                                  The system creates a default workspace named default for the DataArts Studio instance you create and assigns administrator permissions to you. You can use the default workspace or create another workspace.

                                  A workspace in a DataArts Studio instance is the basic unit for member management and role and permission allocation. It provides all DataArts Studio functions. Workspaces are allocated by branch or subsidiary (such as the group, subsidiary, and department), business domain (such as the procurement, production, and sales), or implementation environment (such as the development, test, and production environment). There are no fixed rules.

                                  -

                                  Admins can manage user (member) permissions, resources, and compute engines in a workspace. To enable users to work together, admins can add users to a workspace and assign the preset roles of DataArts Studio (admin, developer, operator, and visitor) to the users. Users other than admins can access Management Center, DataArts Migration, and DataArts Factory only after they are added to a workspace and assigned relevant roles.

                                  -

                                  Constraints

                                  • There is no limit on the number of workspaces that can be created for a DataArts Studio instance. You can plan the quota as needed.
                                  • The storage of job logs and dirty data depends on the OBS service.
                                  +

                                  As an admin, you can manage user (member) permissions, resources, and compute engines for a workspace. To enable users to work together, admins can add users to a workspace and assign the preset roles of DataArts Studio (admin, developer, operator, and visitor) to the users. Users other than admins can access Management Center, DataArts Migration, and DataArts Factory only after they are added to a workspace and assigned relevant roles.

                                  +

                                  Notes and Constraints

                                  • There is no limit on the number of workspaces that can be created for a DataArts Studio instance.
                                  • The storage of job logs and dirty data depends on the OBS service.
                                  -

                                  Prerequisites

                                  You have created a DataArts Studio instance by referring to Creating a DataArts Studio Basic Package.

                                  +

                                  Prerequisites

                                  You have obtained a DataArts Studio instance. For details, see Creating a DataArts Studio Instance.

                                  -

                                  Background

                                  • The system will create a default workspace and assign the admin role to you after you create a DataArts Studio instance.
                                  • In a DataArts Studio instance created by a master account, if an IAM user of the account needs to create a workspace, the IAM user must be assigned the DARTS Administrator or Tenant Administrator policy. By default, the master account has all the permissions for a DataArts Studio instance created by a sub-user.
                                  • Users assigned the permissions of DARTS User can access a workspace only after they are added as members of the workspace.
                                  +

                                  Context

                                  • The system creates a default workspace named default for the DataArts Studio instance you create and assigns admin role to you.
                                  • In a DataArts Studio instance created by an account, if an IAM user of the account needs to create a workspace, the IAM user must be assigned the DARTS Administrator or Tenant Administrator permissions. By default, the account has all the permissions for a DataArts Studio instance created by a user of the account.
                                  • Users with the DARTS User permissions can access a workspace only after they are added as members of the workspace.
                                  -

                                  Creating a Workspace

                                  1. Log in to the DataArts Studio console as user DARTS Administrator or Tenant Administrator. For details, see Accessing the DataArts Studio Instance Console.
                                  2. On the Workspaces page, click Create. In the displayed dialog box, set parameters based on Table 1.

                                    Figure 1 Creating a workspace
                                    +

                                    Creating a Workspace

                                    1. Log in to the DataArts Studio console as user DARTS Administrator or Tenant Administrator. For details, see Accessing the DataArts Studio Instance Console.
                                    2. On the Workspaces page, click Create Workspace. In the displayed dialog box, set the parameters listed in Table 1.

                                      Figure 1 Creating a workspace

                                      -
                                      @@ -102,6 +104,8 @@ @@ -225,7 +229,7 @@ - @@ -254,7 +258,7 @@
                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0123.html b/docs/dataartsstudio/umn/dataartsstudio_01_0123.html index 6ba1db2ee..f26a600e7 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0123.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0123.html @@ -1,10 +1,10 @@ -

                                      Configuring Alarm Rules

                                      +

                                      Configuring CDM Alarm Rules

                                      Scenario

                                      Set the alarm rules to customize the monitored objects and notification policies. Then, learn CDM running status in a timely manner.

                                      A CDM alarm rule includes the alarm rule name, monitored object, metric, threshold, monitoring interval, and whether to send a notification. This section describes how to set CDM alarm rules.

                                      -

                                      Procedure

                                      1. Access the CDM console, choose Cluster Management. Locate a cluster, click More in the Operation column, and select View Metric from the drop-down list.
                                      2. In the navigation pane, choose Cloud Service Monitoring > Cloud Data Migration. In the right pane, locate a CDM cluster and click Create Alarm Rule in the Operation column.

                                        Figure 1 Monitored CDM clusters
                                        +

                                        Procedure

                                        1. Access the CDM console, choose Cluster Management. Locate a cluster, click More in the Operation column, and select View Metric from the drop-down list.
                                        2. In the navigation pane, choose Cloud Service Monitoring > Cloud Data Migration. In the right pane, locate a CDM cluster and click Create Alarm Rule in the Operation column.

                                          Figure 1 Monitored CDM clusters

                                        3. Set the alarm rule for the CDM cluster as prompted.
                                        4. After the setting is complete, click Confirm. When an alarm that meets the rule is generated, the system automatically sends a notification.

                                          For more information about monitoring and alarms, see the Cloud Eye User Guide.

                                        @@ -12,7 +12,14 @@
                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0124.html b/docs/dataartsstudio/umn/dataartsstudio_01_0124.html index 0e58998ea..7cbc975b5 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0124.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0124.html @@ -1,6 +1,6 @@ -

                                        Querying Metrics

                                        +

                                        Querying CDM Metrics

                                        Scenario

                                        You can use Cloud Eye to monitor the running status of a CDM cluster. You can view the monitoring metrics on the Cloud Eye console.

                                        Monitored data takes some time for transmission and display. The status displayed on the Cloud Eye console is the status obtained 5 to 10 minutes before. You can view the monitored data of a newly created CDM cluster 5 to 10 minutes later.

                                        @@ -8,13 +8,20 @@
                                      3. The cluster has been properly running for about 10 minutes.

                                        The monitored data and graphs are available for a newly created cluster after the cluster runs for at least 10 minutes.

                                      -

                                      Procedure

                                      1. Access the CDM console, choose Cluster Management. Locate a cluster, click More in the Operation column, and select View Metric from the drop-down list.
                                      2. On the CDM monitoring page, you can view the graphs of all monitoring metrics.

                                        Figure 1 Querying Metrics
                                        -

                                      3. Click in the upper right corner of the graphs to zoom in the graphs.
                                      4. You can select a time period in the upper left corner to view metric changes in this time period.
                                      +

                                      Procedure

                                      1. Access the CDM console, choose Cluster Management. Locate a cluster, click More in the Operation column, and select View Metric from the drop-down list.
                                      2. On the CDM monitoring page, you can view the graphs of all monitoring metrics.

                                        Figure 1 Querying Metrics
                                        +

                                      3. Click in the upper right corner of the graphs to zoom in the graphs.
                                      4. You can select a time period in the upper left corner to view metric changes in this time period.
                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0125.html b/docs/dataartsstudio/umn/dataartsstudio_01_0125.html index 7b7009439..f71d97595 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0125.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0125.html @@ -2,10 +2,10 @@

                                      MongoDB/DDS Incremental Migration

                                      By using CDM, you can export MongoDB or DDS data within a specified period. With the scheduled jobs of CDM, you can implement incremental migration of MongoDB and DDS.

                                      -

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      +

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      When creating a table/file migration job and selecting the link to MongoDB or DDS as the source link, you can set the query filters in advanced attributes.

                                      -
                                      Figure 1 Setting query filters
                                      +
                                      Figure 1 Setting query filters

                                      You can set this parameter to a macro variable of date and time, for example, {"ts":{$gte:ISODate("${dateformat(yyyy-MM-dd'T'HH:mm:ss.SSS'Z',-1,DAY)}")}}, which indicates searching for the values in the ts field that are greater than those after time macro conversion, that is, only the data generated after the previous day is exported.

                                      After this parameter is set, CDM exports only the data generated on the previous day. In addition, you can set the job to be executed at 00:00:00 every day, so that the data generated every day can be incrementally synchronized.

                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0126.html b/docs/dataartsstudio/umn/dataartsstudio_01_0126.html index e18a09f0c..fd9f31d2c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0126.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0126.html @@ -1,6 +1,6 @@ -

                                      DataArts Migration Operations

                                      +

                                      Key CDM Operations Recorded by CTS

                                      CTS provides records of operations on cloud service resources. With CTS, you can query, audit, and backtrack those operations.

                                      Table 1 Parameters for creating a workspace

                                      Parameter

                                      +
                                      - - - - - - - - - - - - -
                                      Table 1 Parameters for creating a workspace

                                      Parameter

                                      Description

                                      +

                                      Description

                                      Name

                                      +

                                      Name

                                      Workspace names can contain only letters, numbers, underscores (_), and hyphens (-). They cannot exceed 32 characters. In a DataArts Studio instance, workspace names must be unique.

                                      +

                                      Workspace name. It can contain a maximum of 32 characters, including only letters, digits, underscores (_), and hyphens (-). The workspace name must be unique in the current DataArts Studio instance.

                                      Description

                                      +

                                      Description

                                      A description of the workspace.

                                      +

                                      Workspace description

                                      Mode

                                      +

                                      Mode

                                      Workspace mode

                                      -
                                      • Simple: This traditional mode is easy to use but does not allow you to strictly control the data development process and table permissions.
                                      • Enterprise: You can isolate the development environment from the production environment in the DataArts Factory and Management Center modules of DataArts Studio. This prevents developers' operations from affecting services in the production environment. For details about the enterprise mode, see DataArts Studio Enterprise Mode Overview.
                                      +

                                      Select the workspace mode.

                                      +
                                      • Simple: This mode is easy to use, but does not allow you to strictly control data development processes and table permissions.
                                      • Enterprise: In this mode, you can isolate the development environment from the production environment in the DataArts Factory and Management Center modules of DataArts Studio. This prevents developers' operations from affecting services in the production environment. For details about the enterprise mode, see Enterprise Mode Overview.

                                      Enterprise Project

                                      +

                                      Enterprise Project

                                      Enterprise project associated with the default workspace of the DataArts Studio instance.

                                      -
                                      This parameter is available only when an enterprise project has been created. If you want to connect the DataArts Studio instance to a cloud service (such as DWS, MRS, and RDS), ensure that the enterprise project of the DataArts Studio workspace is the same as that of the cloud service instance.
                                      • You can only create one DataArts Studio instance in an enterprise project.
                                      • If you want to enable communication between DataArts Studio and another cloud service, ensure that the enterprise project of DataArts Studio is the same as that of the cloud service.
                                      +

                                      Enterprise project associated with the default workspace of the DataArts Studio instance.

                                      +
                                      This parameter is available only when an enterprise project has been created. If you want to connect the DataArts Studio instance to an instance of another cloud service, such as GaussDB(DWS), MRS, and RDS, ensure that the enterprise project of the DataArts Studio instance's workspace is the same as that of the target cloud service instance.
                                      • You can create only one DataArts Studio instance for an enterprise project.
                                      • If you want to enable communication between DataArts Studio and another cloud service, ensure that the enterprise project of DataArts Studio is the same as that of the target cloud service.
                                      +
                                      NOTE:

                                      If the enterprise project function is not enabled, only one DataArts Studio instance can be created for each IAM project.

                                      +

                                      OBS Bucket for Job Logs

                                      +

                                      Job Log Path

                                      The OBS bucket for storing logs of DataArts Studio data development jobs. To use the DataArts Factory module of DataArts Studio, workspace members must have the read and write permissions on the OBS bucket for storing job logs. Otherwise, the system cannot read or write job logs generated during data development.

                                      -
                                      • Click Select. You can select a created OBS bucket. The selected OBS bucket is globally configured in the current workspace.
                                      • If this parameter is not set, job logs generated during data development are stored in the OBS bucket named dlf-log-{projectId} by default. {projectId} indicates the project ID, which can be obtained by referring to Obtaining a Project ID and Account ID.
                                      +

                                      OBS bucket for storing the job logs of DataArts Factory of DataArts Studio. To use the DataArts Factory module of DataArts Studio, workspace members must have the read and write permissions on the OBS bucket for storing job logs. Otherwise, the system cannot read or write job logs of DataArts Factory.

                                      +
                                      • Click Select. You can select an existing OBS bucket. The selected OBS bucket is globally configured in the current workspace.
                                      • If this parameter is not set, job logs generated during data development are stored in the OBS bucket named dlf-log-{projectId} by default. {projectId} indicates the project ID, which can be obtained in the following way:
                                        1. Register with and log in to the management console.
                                        2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
                                        3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project and its ID from the project list.
                                        +
                                      +
                                      NOTE:

                                      The execution logs of data development jobs are stored in xxxxx.log format in an OBS bucket. xxxxx indicates the job ID. Deleting the historical records of SQL statements that have been executed does not affect services.

                                      +

                                      OBS Bucket for DLI Dirty Data

                                      +

                                      Dirty Data Path

                                      The OBS bucket for storing dirty data generated during DLI SQL execution in DataArts Studio Data Development. To use DataArts Studio DataArts Factory to develop and execute DLI SQL statements, workspace members must have the read and write permissions on the OBS bucket where DLI dirty data is stored. Otherwise, the system cannot read or write the dirty data generated during DLI SQL execution.

                                      -
                                      • Click Select. You can select a created OBS bucket. The selected OBS bucket is globally configured in the current workspace.
                                      • If this parameter is not set, dirty data generated during DLI SQL execution is stored in the OBS bucket named dlf-log-{projectId} by default.
                                      +

                                      OBS bucket for storing dirty data generated during DLI SQL execution in DataArts Factory of DataArts Studio. To use DataArts Factory to develop and execute DLI SQL statements, workspace members must have the read and write permissions on the OBS bucket where DLI dirty data is stored. Otherwise, the system cannot read or write the dirty data generated during DLI SQL execution.

                                      +
                                      • Click Select. You can select a created OBS bucket. The selected OBS bucket is globally configured in the current workspace.
                                      • If you do not set this parameter, dirty data generated during DLI SQL execution is stored in the OBS bucket named dlf-log-{projectId} by default.
                                      -

                                    3. Click OK.
                                    4. +

                                    5. Click OK.
                                    6. -

                                      Related Operations

                                      • Disable a workspace: After a workspace is created, it is enabled by default. You can disable or enable it as needed.

                                        On the Workspaces page, locate the target workspace, and click in the Status column to disable the workspace. In the displayed Disable Workspace dialog box, learn about the impact of disabling the workspace and click Yes to disable the workspace.

                                        -

                                        If you disable a workspace, you cannot access the workspace, edit the workspace, view quotas of the workspace, or schedule jobs in the workspace.

                                        +

                                        Related Operations

                                        • Disabling a workspace: After a workspace is created, it is enabled by default. If you do not need a workspace, you can disable it. If you want to use it in the future, you can enable it again.

                                          On the Workspaces page, locate the target workspace, click More in the Operation column, and select Disable Workspace. In the Disable Workspace dialog box displayed, read the impact of disabling a workspace. If you want to continue, click Yes.

                                          +

                                          If you disable a workspace, you cannot access the workspace, edit the workspace, or view the quota of the workspace. In addition, jobs being scheduled in the workspace will stop.

                                          -
                                        • Enable a workspace: On the Workspaces page, locate the target workspace, and click in the Status column to enable the workspace. In the displayed Enable Workspace dialog box, click Yes.
                                        • Edit a workspace: On the Workspaces page, locate the target workspace, and click Edit in the Operation column. In the displayed Workspace Information dialog box, modify the workspace parameters listed in Table 1 and click OK.
                                        • Add/Edit a tag: On the Workspaces page, locate a workspace, click More in the Operation column, and select tags. In the displayed tags dialog box, click Add/Edit Tag to associate tags with the workspace.
                                        • View quota usage: On the Workspaces page, locate a workspace and click Quota Usage in the Operation column. In the displayed Quota Usage dialog box, you can view the quota usage of each service in the workspace.
                                        • Pin a workspace to top: On the Workspaces tab page, locate the target workspace, click More in the Operation column, and select Pin to Top.
                                        • Delete a workspace: On the Workspaces page, locate the target workspace, click More in the Operation column, and select Delete. In the displayed Delete Workspace dialog box, click OK.

                                          To prevent service loss caused by mis-deletion, the system allows only the DARTS Administrator or Tenant Administrator to delete workspaces. Before deleting a workspace, ensure that no resource is available in any of the following modules:

                                          +
                                        • Enabling a workspace: On the Workspaces page, locate the workspace you want to enable, click More in the Status column, and select Enable Workspace. In the Enable Workspace dialog box displayed, read the impact of enabling a workspace. If you want to continue, click Yes.
                                        • Editing a workspace: On the Workspaces page, locate the workspace you want to edit and click Edit in the Operation column. In the displayed Workspace Information dialog box, modify workspace parameters by referring to Table 1 and click OK.

                                          When editing a workspace, you can add workspace members (see Adding Workspace Members and Assigning Roles).

                                          +
                                        • Viewing the quota usage: On the Workspaces page, locate a workspace and click Quota Usage in the Operation column. In the displayed Quota Usage dialog box, you can view the quota usage of each module.
                                        • Pinning a workspace to top: On the Workspaces page, locate a workspace, click More in the Operation column, and select Pin to Top.
                                        • Deleting a workspace: On the Workspaces page, locate a workspace, click More in the Operation column, and select Delete. In the Delete Workspace dialog box, click OK.

                                          Mis-deletion may result in service loss. To delete a workspace, you must use the DARTS Administrator or Tenant Administrator account and ensure that the workspace does not contain any of the following resources:

                                          • Management Center: data connections
                                          • DataArts Migration: CDM clusters
                                          • DataArts Factory: jobs, job directories, scripts, script directories, and resources
                                          -

                                          If any component of a workspace has any service resource, deleting the workspace will fail.

                                          +

                                          If any module has resources, a message is displayed, indicating that the workspace cannot be deleted.

                                          If any module has resources, delete the resources as prompted and try again.

                                          -
                                          Figure 2 Message indicating that the workspace cannot be deleted
                                          +
                                          Figure 2 Message indicating that the workspace cannot be deleted

                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0116_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0116_0.html deleted file mode 100644 index 5a55e96e0..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0116_0.html +++ /dev/null @@ -1,16 +0,0 @@ - - -

                                        Migration in Transaction Mode

                                        -

                                        When a CDM job fails to be executed, CDM rolls back the data to the state before the job starts and automatically deletes data from the destination table.

                                        -
                                        • Parameter position: When creating a table/file migration job, if the migration source is a relational database, set Import to Staging Table in the advanced attributes of Destination Job Configuration to determine whether to enable the transaction mode.
                                        • Parameter principle: If you set this parameter to Yes, CDM automatically creates a temporary table and imports the data to the temporary table. After the data is imported successfully, CDM migrates the data to the destination table in transaction mode of the database. If the import fails, the destination table is rolled back to the state before the job starts.
                                          Figure 1 Migration in transaction mode
                                          -

                                          -
                                        -

                                        If you select Clear part of data or Clear all data for Clear Data Before Import, CDM does not roll back the deleted data in transaction mode.

                                        -
                                        -
                                        -
                                        - -
                                        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0117.html b/docs/dataartsstudio/umn/dataartsstudio_01_0117.html index 30457c75a..7cbe1bf6d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0117.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0117.html @@ -1,26 +1,27 @@ -

                                        Adding a Member and Assigning a Role

                                        -

                                        For IAM users with the DARTS User permission, a workspace role determines their permissions in the workspace. If you want to allow another IAM user with the DARTS User permission to use your DataArts Studio instance, create an IAM user by referring to Creating an IAM User and Assigning DataArts Studio Permissions, and add the user as the workspace member and configure a role for the user by following the instructions in this section.

                                        -

                                        A workspace role determines the permissions of a user in the workspace. Currently, the following preset roles are available: admin, developer, deployer, operator, and viewer. You can also customize roles based on (Optional) Defining a Workspace Role. For details about the permissions of each role, see "DataArts Studio Permissions" in Service Overview.

                                        +

                                        Adding Workspace Members and Assigning Roles

                                        +

                                        For IAM users with DARTS User account permissions, their permissions in a DataArts Studio workspace are determined by workspace roles. If you want to share a DataArts Studio instance with an IAM user with the DARTS User account permissions, prepare an IAM user by referring to Creating an IAM User and Assigning DataArts Studio Permissions, add the user as a workspace member, and assign a role to the member.

                                        +
                                        Figure 1 Permission system
                                        +

                                        A workspace role determines the permissions of a user in a workspace. Preset roles include admin, developer, deployer, operator, and viewer. You can also customize roles by referring to (Optional) Defining a Workspace Role. For the detailed descriptions of the permissions of each role, see "Permissions" in Service Overview.

                                        • Admin: This role has all operation permissions in a workspace. You are advised to assign the admin role to the project owner, development owner, and O&M administrator.
                                        • Developer: This role has permissions to create and manage resources in a workspace. You are advised to assign this role to users who develop and process tasks.
                                        • Operator: This role has the operation permissions of services such as O&M and scheduling in a workspace, but cannot modify resources or configurations. You are advised to assign this role to users responsible for O&M management and status monitoring.
                                        • Viewer: This role can view data in a workspace but cannot perform any other operation. You are advised to assign this role to users who only need to view data in a workspace but do not need to perform operations.
                                        • Deployer: This role is unique to the enterprise mode and has permissions to release task packages in a workspace. In enterprise mode, when a developer submits a script or job version, the system generates a release task. After the developer confirms the release and the deployer approves the release request, the modified job is synchronized to the production environment.
                                        • Custom roles: If the preset roles cannot meet your requirements, you can create custom roles. You can configure permissions for such roles to meet the the principle of least privilege (PoLP).
                                        -

                                        Background

                                        If the permissions of DARTS User has been assigned to the created IAM user, you must add workspace members and roles. Otherwise, the IAM user cannot view existing DataArts Studio workspaces.

                                        +

                                        Context

                                        If an IAM user is granted the DARTS User permissions, you also need to add the user as a workspace member and assign a role to the user. Otherwise, the IAM user cannot view existing DataArts Studio workspaces.

                                        -

                                        Constraints

                                        Due to the limitation of the authentication cache mechanism, changes to the roles of workspace members do not take effect immediately. Instead, the changes take effect only after the workspace members stop accessing the DataArts Studio console and wait for 6 minutes.

                                        +

                                        Notes and Constraints

                                        Due to the limitations of the authentication cache mechanism, a change to the role of a workspace member does not take effect immediately. The change takes effect six minutes after the workspace member stops accessing the DataArts Studio console.

                                        -

                                        Prerequisites

                                        You have changed your account to either of the following:
                                        • DARTS Administrator or Tenant Administrator
                                        • DARTS User, which is the workspace administrator
                                        +

                                        Prerequisites

                                        You are using either of the following accounts:
                                        • DARTS Administrator or Tenant Administrator
                                        • DARTS User, which is the administrator of the current workspace
                                        -

                                        Adding a Member and Assigning a Role

                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                        2. On the Workspaces page, locate the target workspace and click Edit in the Operation column.

                                          Figure 1 Workspace Information dialog box
                                          -

                                          -

                                          -

                                        3. Click Add under Workspace Members. In the displayed Add Member dialog box, select Add User or Add Group, select a member account from the drop-down list, and select a role for it.

                                          Figure 2 Adding a member
                                          +

                                          Adding a Member and Assigning a Role

                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                          2. On the Workspaces page, locate the target workspace and click Edit in the Operation column.

                                            Figure 2 Workspace Information dialog box
                                            +

                                            +

                                            +

                                          3. Click Add next to Workspace Members. In the displayed Add Member dialog box, select User or Group for Account Type, select a user or group from the Member Account drop-down list, and select a role.

                                            Figure 3 Adding a member

                                            -

                                          4. Click OK. You can view or modify the members and roles in the member list, or remove members from the workspace.
                                          +

                                        4. Click OK. You can view or modify the members and roles in the member list, or delete members from the workspace.
                                        -

                                        Related Operations

                                        • Remove workspace members: In the Workspace Information dialog box, select the members to remove and click Remove. In the Remove Member dialog box, click Yes.

                                          The creator of a workspace cannot be removed.

                                          +

                                          Related Operations

                                          • Removing a workspace member: In the Workspace Information dialog box, select the workspace members to remove, and click Remove. In the Remove Member dialog box, click Yes.

                                            The creator of a workspace cannot be removed.

                                            -
                                            Figure 3 Removing members
                                            +
                                            Figure 4 Removing a member

                                          @@ -31,3 +32,10 @@
                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0117_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0117_0.html deleted file mode 100644 index 30bc711e9..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0117_0.html +++ /dev/null @@ -1,32 +0,0 @@ - - -

                                          Encryption and Decryption During File Migration

                                          -
                                          When you migrate files to a file system, CDM can encrypt and decrypt those files. Currently, CDM supports the following encryption modes: -
                                          -

                                          AES-256-GCM

                                          Currently, only AES-256-GCM (NoPadding) is supported. This algorithm is used for encryption at the migration destination and decryption at the migration source. The supported source and destination data sources are as follows:

                                          -
                                          • Data sources supported by the migration source: HDFS (supported in the binary format)
                                          • Data sources supported by the migration destination: HDFS (supported in the binary format)
                                          -

                                          The following part describes how to use AES-256-GCM to decrypt the encrypted files to be exported from HDFS and encrypt the files to be imported to HDFS.

                                          -
                                          • Configure decryption at the migration source.
                                            When you use CDM to create a job for exporting files from HDFS, set the migration source to HDFS and file format to binary, and set the following parameters in the advanced settings of Source Job Configuration:
                                            1. Encryption: Select AES-256-GCM.
                                            2. DEK: The key must be the same as that configured in encryption. Otherwise, the decrypted data is incorrect and the system does not display an error message.
                                            3. IV: The initialization vector must be the same as that configured in encryption. Otherwise, the decrypted data is incorrect and the system does not display an error message.
                                            -
                                            -

                                            In this way, after CDM exports encrypted files from HDFS, the files written to the migration destination are decrypted plaintext files.

                                            -
                                          -
                                          • Configure encryption at the migration destination.
                                            When you create a CDM job to import files to HDFS, set the migration destination to HDFS and file format to binary, and set the following parameters in the advanced settings of Destination Job Configuration:
                                            1. Encryption: Select AES-256-GCM.
                                            2. DEK: custom encryption key. The key consists of 64 hexadecimal numbers. It is case-insensitive but must contain 64 characters. For example, DD0AE00DFECD78BF051BCFDA25BD4E320DB0A7AC75A1F3FC3D3C56A457DCDC1B.
                                            3. IV: custom initialization vector. The initialization vector consists of 32 hexadecimal numbers. It is case-insensitive but must contain 32 characters. For example, 5C91687BA886EDCD12ACBC3FF19A3C3F.
                                            -
                                            -

                                            In this way, after CDM imports files to HDFS, the files in the destination HDFS are encrypted using the AES-256-GCM algorithm.

                                            -
                                          -
                                          -

                                          KMS Encryption

                                          The migration source does not support KMS encryption.

                                          -
                                          -

                                          CDM supports KMS encryption if tables, files, or a whole database is migrated to OBS. In the Advanced Attributes area of the Destination Job Configuration page, set the parameters.

                                          -

                                          A key must be created in KMS of DEW in advance. For details, see the Data Encryption Workshop User Guide.

                                          -

                                          After KMS encryption is enabled, objects to be uploaded will be encrypted and stored on OBS. When you download the encrypted objects, the encrypted data will be decrypted on the server and displayed in plaintext to users.

                                          -
                                          • If KMS encryption is enabled, MD5 verification cannot be used.
                                          • If the KMS ID of another project is used, change Project ID to the ID of the project to which KMS belongs. If KMS and CDM are in the same project, retain the default value of Project ID.
                                          • After KMS encryption is performed, the encryption status of the objects on OBS cannot be changed.
                                          • A key in use cannot be deleted. Otherwise, the object encrypted with this key cannot be downloaded.
                                          -
                                          -
                                          -
                                          -
                                          - -
                                          - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0118.html b/docs/dataartsstudio/umn/dataartsstudio_01_0118.html index 324195630..d1ff29275 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0118.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0118.html @@ -1,19 +1,19 @@

                                          Authorizing Users to Use DataArts Studio

                                          -
                                          +
                                          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0118_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0118_0.html deleted file mode 100644 index a8ee7ec4a..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0118_0.html +++ /dev/null @@ -1,18 +0,0 @@ - - -

                                          MD5 Verification

                                          -

                                          CDM extracts data from the migration source and writes the data to the migration destination. Figure 1 shows the migration mode when files are migrated to OBS.

                                          -
                                          Figure 1 Migrating files to OBS
                                          -

                                          During the process, CDM uses MD5 to verify file consistency.

                                          -
                                          • Extract
                                            • The migration source can be OBS, HDFS, FTP, SFTP, or HTTP. It can check whether the files extracted by CDM are consistent with source files.
                                            • This function is controlled by the MD5 File Extension parameter (available when File Format is set to Binary) in Source Job Configuration. Set this parameter to the file name extension of the MD5 file in the source file system.
                                            • If a source file build.sh and a file for saving MD5 value build.sh.md5 are located in the same directory, and MD5 File Extension is configured, only the file build.sh.md5 is migrated to the destination. Files without the MD5 value or whose MD5 values do not match fail to be migrated, and the MD5 file is not migrated.
                                            • If MD5 File Extension is not configured, all files are migrated.
                                            -
                                          • Write
                                            • Currently, this function can be used only when OBS serves as the migration destination. It can check whether the files written to OBS are consistent with those extracted from CDM.
                                            • This function is controlled by the Validate MD5 Value parameter in Destination Job Configuration. After the files are read and written to OBS, the MD5 value in the HTTP header is used to verify the files on OBS and the verification result is written to an OBS bucket (the bucket can be the one that does not store migration files). If the migration source does not have the MD5 file, the verification will not be performed.
                                            -
                                          -
                                          • When files are migrated to a file system, only the extracted files are verified.
                                          • When files are migrated to OBS, both the extracted files and files written to OBS are verified.
                                          • If MD5 verification is used, KMS encryption cannot be used.
                                          -
                                          -
                                          -
                                          - -
                                          - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0119.html b/docs/dataartsstudio/umn/dataartsstudio_01_0119.html index 80caceeb8..3a0f39f0c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0119.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0119.html @@ -1,13 +1,13 @@ -

                                          (Optional) Creating a DataArts Studio Incremental Package

                                          -

                                          DataArts Studio provides basic and incremental packages. If the basic package cannot meet your requirements, you can create an incremental package. Before you create an incremental package, ensure that you have a DataArts Studio instance.

                                          -

                                          DataArts Studio provides the following types of incremental packages:

                                          -
                                          • DataArts Migration incremental package

                                            CDM clusters can migrate data to the cloud and integrate data into the data lake. It provides wizard-based configuration and management and can integrate data from a single table or an entire database incrementally or periodically. The DataArts Studio instance has no CDM cluster. To use CDM functions, you must create a DataArts Migration incremental package.

                                            -
                                          -

                                          Background

                                          • If you create a DataArts Migration incremental package, the system automatically creates a CDM cluster based on the specifications you select.
                                          • If you create a DataArts DataService incremental package, the system automatically creates a DataArts DataService cluster based on the specifications you select.
                                          • You can choose More > View Packages to view incremental packages.
                                          +

                                          Creating a DataArts Migration Incremental Package

                                          +

                                          A DataArts Migration (that is, CDM) incremental package provides resources for a CDM cluster. When you create a CDM incremental package, the system automatically creates a CDM cluster based on the specifications you select for the incremental package.

                                          +
                                          CDM clusters can be used in the following scenarios:
                                          • Data migration jobs can be created and run in CDM clusters to migrate data to the cloud or import data to the data lake.
                                          • CDM clusters can be used as agents of data connections in Management Center, which enable communications between DataArts Studio instances and data sources.
                                          -

                                          Creating a CDM Cluster

                                          1. Locate an enabled instance and click Create.
                                          1. On the displayed page, set parameters based on Table 1. +

                                            A DataArts Studio instance does not contain CDM clusters. To use CDM clusters, create DataArts Migration incremental packages.

                                            +

                                            Context

                                            • When you create a DataArts Migration (CDM) incremental package, the system automatically creates a CDM cluster based on the specifications you select for the incremental package.
                                            • You can locate a DataArts Studio instance, click More, and select View Packages to view your incremental packages.
                                            +
                                            +

                                            Creating a CDM Cluster

                                            1. Locate an enabled instance and click Create.
                                            1. On the displayed page, set parameters based on Table 1.
                                              - - - - - - - - - - - - @@ -86,12 +75,12 @@

                                              You cannot modify the specifications of an existing cluster. If you need higher specifications, create another cluster.

                                              -
                                            2. Click Create Now, confirm the specifications, and click Next.
                                            3. View the CDM cluster in the corresponding workspace.
                                            4. +
                                            5. Click Create Now, confirm the specifications, and click Next.
                                            6. Go to the corresponding workspace to view the CDM cluster you have created.
                                            7. diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0120.html b/docs/dataartsstudio/umn/dataartsstudio_01_0120.html index 779880c1f..f926c83cd 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0120.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0120.html @@ -1,23 +1,54 @@ -

                                              (Optional) Defining a Workspace Role

                                              -

                                              For IAM users with the DARTS User permission, a workspace role determines their permissions in the workspace. Currently, five preset roles are available: admin, developer, deployer, operator, and viewer. For details about the permissions of each role, see "DataArts Studio Permissions" in Service Overview.

                                              -

                                              If the preset roles can meet your requirements, skip this section. Otherwise, create custom roles by following the instructions in this section.

                                              -

                                              Background

                                              • The DARTS Administrator or Tenant Administrator account can create custom roles in a workspace.
                                              -
                                              -

                                              Constraints

                                              • Due to the restriction of the authentication cache mechanism, when the permission of a custom role changes, the change does not take effect immediately for the workspace members with this role. The permission change takes effect only after the workspace members with this role stop accessing the DataArts Studio console and wait for 6 minutes.
                                              • Even if a custom role has the same permissions as the admin, the custom role cannot perform some operations that require the admin role for example, exporting all the APIs in DataArts DataService.
                                              -
                                              -

                                              Procedure

                                              1. Log in to the DataArts Studio console as DARTS Administrator or Tenant Administrator. For details, see Accessing the DataArts Studio Instance Console.
                                              2. On the Roles page, click Create. In the displayed dialog box, set the following parameters:

                                                • Role Name: unique identifier of a custom role. You are advised to name the role to fit its application scenario and avoid any meaningless description.
                                                • Role Description: description of the role, for example, the key permission differences between the role and preset roles
                                                • Role Type: The role permissions in simple mode differ from those in enterprise mode. Select an appropriate role type based on the scenario. For details about the enterprise mode, see DataArts Studio Enterprise Mode Overview.
                                                  • If the role is used in a workspace in simple mode, select CUSTOM.
                                                  • If the role is used in the development environment of a workspace in enterprise mode, select DEV_CUSTOM.
                                                  • If the role is used in the production environment of a workspace in enterprise mode, select PROD_CUSTOM.
                                                  -
                                                • Reuse: Use this function if you only need to slightly adjust the permissions of the preset roles to meet your requirements. Otherwise, you can directly select permissions for the role.

                                                  When you create or edit a role, if your account has the DARTS Administrator or Tenant Administrator permission but the system still displays an error message indicating that you do not have the permission to perform this operation, you are advised to change another network and try again.

                                                  -
                                                  +

                                                  From DLI

                                                  +

                                                  If the source link of a job is a DLI link, configure the source job parameters based on Table 1.

                                                  + +
                                              Table 1 Parameters for the CDM incremental package

                                              Parameter

                                              Description

                                              @@ -16,68 +16,57 @@

                                              Package

                                              Select DataArts Migration.

                                              +

                                              Select DataArts Migration.

                                              AZ

                                              When you create a DataArts Studio instance or incremental package for the first time, there is no requirement on the AZ.

                                              -
                                              When you create a new DataArts Studio instance or incremental package, determine whether to select the same AZ as the existing one based on your DR and network latency demands.
                                              • If your application requires good DR capability, deploy resources in different AZs in the same region.
                                              • If your application requires a low network latency between instances, deploy resources in the same AZ.
                                              +

                                              When you your first DataArts Studio instance or incremental package, you can select any available AZ.

                                              +
                                              When you create another DataArts Studio instance or incremental package, determine whether to select the same AZ as the first instance or incremental package based on your DR and network latency demands.
                                              • If your application requires good DR capability, select an AZ different from that of the first instance or incremental package in the same region.
                                              • If your application requires a low network latency between instances, select the same AZ as the first instance or incremental package.

                                              Workspace

                                              Select the workspace where the DataArts Migration incremental package will be used. The CDM cluster can only be used in this workspace.

                                              +

                                              Select the workspace where the CDM incremental package is to be used. A CDM cluster can be used in a workspace only after the CDM cluster is associated with the workspace.

                                              Enterprise Project

                                              If the CDM cluster is associated with multiple workspaces, you need to specify an enterprise project for the CDM cluster.

                                              +

                                              If the CDM cluster is associated with multiple workspaces, select an enterprise project for the CDM cluster.

                                              Cluster

                                              +

                                              Cluster Name

                                              Customize the cluster name.

                                              Instance

                                              +

                                              Instance Type

                                              The following CDM cluster flavors are available:

                                              -
                                              • cdm.large: 8 vCPUs and 16 GB of memory. The maximum and assured bandwidths are 3 Gbit/s and 0.8 Gbit/s. Up to 16 jobs can be executed concurrently.
                                              • cdm.xlarge: 16 vCPUs and 32 GB of memory. The maximum and assured bandwidths are 10 Gbit/s and 4 Gbit/s. Up to 32 jobs can be executed concurrently. This flavor is suitable for migrating terabytes of data that requires a bandwidth of 10GE.
                                              • cdm.4xlarge: 64 vCPUs and 128 GB of memory. The maximum and assured bandwidths are 40 Gbit/s and 36 Gbit/s. Up to 128 jobs can be executed concurrently.
                                              • The free ECS with 4 vCPUs and 8 GB memory provided by DataArts Studio can run only one job.
                                              +
                                              • cdm.large: the large flavor with 8 vCPUs and 16 GB of memory. The maximum and assured bandwidths are 3 Gbit/s and 0.8 Gbit/s. Up to 16 jobs can be executed concurrently.
                                              • cdm.xlarge: the ultra-large flavor with 16 vCPUs and 32 GB of memory. The maximum and assured bandwidths are 10 Gbit/s and 4 Gbit/s. Up to 32 jobs can be executed concurrently. This flavor is suitable for migrating terabytes of data that requires a bandwidth of 10GE.
                                              • cdm.4xlarge: the 4x ultra-large flavor with 64 vCPUs and 128 GB of memory. The maximum and assured bandwidths are 40 Gbit/s and 36 Gbit/s. Up to 128 jobs can be executed concurrently.

                                              VPC

                                              VPC to which the CDM cluster in the DataArts Studio instance belongs. A VPC is a secure, isolated, and logical network environment.

                                              -

                                              If you want to connect the DataArts Studio instance or CDM cluster to a cloud service (such as DWS, MRS, and RDS), ensure that the CDM cluster can communicate with the cloud service. If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If the CDM cluster and the cloud service are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules.

                                              -

                                              For details about the operations on VPCs, subnets, and security groups, see Virtual Private Cloud User Guide.

                                              -
                                              NOTE:

                                              After the CDM instance is created, the VPC cannot be changed.

                                              +

                                              VPC, subnet, and security group to which the CDM cluster in the DataArts Studio instance belongs.

                                              +

                                              If you want to connect the DataArts Studio instance or CDM cluster to a cloud service such as GaussDB(DWS), MRS, and RDS, ensure that the CDM cluster can communicate with the cloud service. If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If the CDM cluster and the cloud service are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules.

                                              +

                                              For details about the operations on VPCs, subnets, and security groups, see Virtual Private Cloud User Guide.

                                              +
                                              NOTE:
                                              • After the CDM cluster is created, its VPC, subnet, and security group cannot be changed. Set them carefully.
                                              • You can select a VPC subnet shared by the VPC owner when you create a CDM cluster. Through VPC subnet sharing, you can easily configure and manage multiple accounts' resources at low costs. For details about how to share a VPC subnet, see "VPC Sharing" in Virtual Private Cloud User Guide.

                                              Subnet

                                              -

                                              Subnet to which the CDM cluster in the DataArts Studio instance belongs. A subnet provides dedicated network resources that are isolated from other networks, improving network security.

                                              -

                                              If you want to connect the DataArts Studio instance or CDM cluster to a cloud service (such as DWS, MRS, and RDS), ensure that the CDM cluster can communicate with the cloud service. If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If the CDM cluster and the cloud service are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules.

                                              -

                                              For details about the operations on VPCs, subnets, and security groups, see Virtual Private Cloud User Guide.

                                              -
                                              NOTE:

                                              After the CDM instance is created, the VPC cannot be changed.

                                              -
                                              +

                                              Subnet

                                              Security Group

                                              -

                                              Security group to which the CDM cluster in the DataArts Studio instance belongs. A security group is a set of ECS access rules. It provides access policies for ECSs that have the same security protection requirements and are mutually trusted in a VPC.

                                              -

                                              If you want to connect the DataArts Studio instance or CDM cluster to a cloud service (such as DWS, MRS, and RDS), ensure that the CDM cluster can communicate with the cloud service. If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If the CDM cluster and the cloud service are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules.

                                              -

                                              For details about the operations on VPCs, subnets, and security groups, see Virtual Private Cloud User Guide.

                                              -
                                              NOTE:

                                              After the CDM instance is created, the security group cannot be changed.

                                              -
                                              +

                                              Security Group

                                              IPv6 Dual Stack

                                              If you enable this function, both private IPv4 and IPv6 addresses can be used to access the cluster.

                                              -
                                              NOTE:
                                              • If you enable this function, you can only select subnets for which IPv6 CIDR blocks are enabled. If you want to select a subnet for which IPv6 CIDR blocks are disabled, enable IPv6 CIDR blocks for the subnet in the VPC service.
                                              • IPv6 dual stack can be enabled for private IP addresses, but not for public IP addresses.
                                              +

                                              Whether to enable IPv6 dual stack.

                                              +

                                              If you enable this function, both private IPv4 and IPv6 addresses can be used to access the cluster.

                                              +
                                              NOTE:
                                              • If you enable this function, you can only select subnets for which IPv6 CIDR blocks are enabled. If IPv6 CIDR blocks are disabled for the subnet you want to select, enable IPv6 CIDR blocks for the subnet in the VPC service.
                                              • IPv6 dual stack can be enabled for private IP addresses, but not for public IP addresses.
                                              + + + + + + + + + + + + + + + + + + + + + +
                                              Table 1 Parameter description

                                              Parameter

                                              +

                                              Description

                                              +

                                              Example Value

                                              +

                                              Resource Queue

                                              +

                                              Resource queue to which the destination table belongs

                                              +

                                              The default queue of DLI cannot be used for migration jobs. You need to create a SQL queue in DLI.

                                              +

                                              cdm

                                              +

                                              Database Name

                                              +

                                              Name of the database to which data will be written

                                              +

                                              dli

                                              +

                                              Table Name

                                              +

                                              Name of the table to which data will be written

                                              +

                                              car_detail

                                              +

                                              Partition

                                              +

                                              Partition information

                                              +
                                              • ['year=2020']
                                              • ['year=2020,location=sun']
                                              • ['year=2020,location=sun', 'year=2021,location=earth']
                                              • Read data of the previous day:

                                                If the current date is 2024-07-16, ['DS=${dateformat(yyyy-MM-dd, -1, DAY)}'] indicates that the data whose DS partition value is 2024-07-15 is extracted.

                                                +

                                                For details about other scenarios, see Using Macro Variables of Date and Time.

                                              -

                                              -

                                            8. After configuring the role name, type, and permissions, click OK.
                                            9. Set the IAM user as a custom role by referring to Adding a Member and Assigning a Role.
                                            10. +
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0120_0.html b/docs/dataartsstudio/umn/dataartsstudio_01_0120_0.html deleted file mode 100644 index 7aeb26aa9..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0120_0.html +++ /dev/null @@ -1,52 +0,0 @@ - - -

                                            From DLI

                                            -

                                            If the source link of a job is a DLI link, configure the source job parameters based on Table 1.

                                            - -
                                            - - - - - - - - - - - - - - - - - - - - - -
                                            Table 1 Parameter description

                                            Parameter

                                            -

                                            Description

                                            -

                                            Example Value

                                            -

                                            Resource Queue

                                            -

                                            Resource queue to which the destination table belongs

                                            -

                                            The default queue of DLI cannot be used for migration jobs. You need to create a SQL queue in DLI.

                                            -

                                            cdm

                                            -

                                            Database Name

                                            -

                                            Name of the database to which data will be written

                                            -

                                            dli

                                            -

                                            Table Name

                                            -

                                            Name of the table to which data will be written

                                            -

                                            car_detail

                                            -

                                            Partition

                                            -

                                            Partition information

                                            -

                                            year=2020,location=sun

                                            -
                                            -
                                            -
                                            -
                                            - -
                                            - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0121.html b/docs/dataartsstudio/umn/dataartsstudio_01_0121.html index 642db53c0..a93c0cad7 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0121.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0121.html @@ -1,19 +1,19 @@ -

                                            Viewing Metrics

                                            +

                                            Managing and Viewing CDM Metrics

                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0122.html b/docs/dataartsstudio/umn/dataartsstudio_01_0122.html index f7c34c3ee..21cc8d94f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0122.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0122.html @@ -3,7 +3,7 @@

                                            CDM Metrics

                                            Function

                                            Cloud Eye monitors the running status of cloud services and usage of each metric, and creates alarm rules for monitoring metrics.

                                            After you create a CDM cluster, Cloud Eye automatically associates with CDM monitoring metrics to help you understand the running status of the CDM cluster.

                                            -
                                            • This section describes the CDM metrics that can be monitored by Cloud Eye as well as their namespaces and dimensions.
                                            • For details about CDM monitoring metrics, see Querying Metrics.
                                            • For details about how to set alarm rules, see Configuring Alarm Rules.
                                            +
                                            • This section describes the CDM metrics that can be monitored by Cloud Eye as well as their namespaces and dimensions.
                                            • For details about CDM monitoring metrics, see Querying CDM Metrics.
                                            • For details about how to set alarm rules, see Configuring CDM Alarm Rules.

                                            Prerequisites

                                            You have obtained required Cloud Eye permissions.

                                            @@ -88,6 +88,8 @@

                                      Number of jobs in the PENDING state in the CDM instance.

                                      Unit: count

                                      +
                                      NOTE:

                                      This metric is available in version 2.10.0.300 and later versions.

                                      +

                                      >=0

                                      Number of concurrent extraction threads in the Waiting state in the CDM instance.

                                      Unit: count

                                      +
                                      NOTE:

                                      This metric is available in version 2.10.0.300 and later versions.

                                      +

                                      >=0

                                      Measures the disk inodes usage of the physical server accommodating the monitored ECS, which is not accurate as that obtained on the monitored ECS.

                                      Unit: %

                                      0.001% to 0.9%

                                      +

                                      0.001% to 100%

                                      Cloud Data Migration

                                      - - - - - - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0462.html b/docs/dataartsstudio/umn/dataartsstudio_01_0462.html index a94ed3491..21af46204 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0462.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0462.html @@ -56,7 +56,7 @@ + + + +
                                      Table 1 Key operations recorded by CTS

                                      Operation

                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0127.html b/docs/dataartsstudio/umn/dataartsstudio_01_0127.html index 097ca3b46..68aeb427a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0127.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0127.html @@ -8,8 +8,8 @@

                                      Procedure

                                      1. Log in to the management console and choose Cloud Trace Service from the service list.
                                      2. The trace list is displayed by default. You can filter traces.
                                        The sources of DataArts Studio traces include:
                                        • CDM: traces of DataArts Migration
                                        • DLF: traces of DataArts Factory
                                        • DLG: traces of Management Center, DataArts Architecture, DataArts Quality, DataArts Catalog, and DataArts DataService
                                        -
                                        Figure 1 CDM traces
                                        -
                                      3. Click on the left of a trace to expand its details.
                                      4. Click View Trace in the Operation column to view the trace structure details.

                                        For more information about CTS, see Cloud Trace Service User Guide.

                                        +
                                        Figure 1 CDM traces
                                        +
                                      5. Click on the left of a trace to expand its details.
                                      6. Click View Trace in the Operation column to view the trace structure details.

                                        For more information about CTS, see Cloud Trace Service User Guide.

                                      @@ -19,3 +19,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0128.html b/docs/dataartsstudio/umn/dataartsstudio_01_0128.html deleted file mode 100644 index a971ba887..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0128.html +++ /dev/null @@ -1,38 +0,0 @@ - - -

                                      Managing Agents

                                      -

                                      If your data is stored in HDFS or a relational database, you can deploy an agent on the source network. CDM pulls data from your internal data sources through an agent but cannot write data into the databases.

                                      -
                                      Figure 1 Scenario
                                      -

                                      -

                                      Figure 2 shows the process of using an agent.

                                      -
                                      Figure 2 Process
                                      -

                                      Prerequisites

                                      • A CDM cluster is available.
                                      • A Linux server (for example, a Linux ECS) is available. The Linux server has no special requirements for vCPUs, memory, and disks, but must meet the following requirements:
                                        • Java 8 (64-bit) has been installed and Java environment variables have been configured.
                                        • User Ruby must be granted the write permission of the /tmp directory. If there is no user Ruby, create one.
                                        -
                                      -
                                      -

                                      Creating an Agent

                                      1. Access the CDM console and choose Cluster Management in the left navigation pane. Locate the target cluster, choose Job Management > Agent Management > Create Agent, and configure agent parameters.

                                        Figure 3 Creating an agent
                                        -
                                        • IP Address: Set this parameter to the IP address of the server where the agent is deployed on the source network.
                                        • Port: custom port of the agent Recommended value range: 1024–65535.
                                        • Enable Compression: whether to compress data using the gzip algorithm.
                                          • Enable this function for text data (data based on character encoding, such as MySQL INT data) because such data can be well compressed by the gzip algorithm. (For details about text data, see the related database documentation.)
                                          • Disable this function for binary data (data based on value encoding, such as MySQL BINARY data) because such data has been compressed, and compressing it again will increase the workload to decompress data and undermine the performance of the client. (For details about text data, see the related database documentation.)
                                          -
                                        • Enable SSL: whether to enable two-way SSL authentication Enable this function if security is of high priority.
                                        • Bandwidth Throttling: set the maximum downstream rate of the agent. By default, there is no throttling.
                                        -

                                      2. Click OK. On the Agent Management page, view the created agent.
                                      -
                                      -

                                      Installing and Starting an Agent

                                      1. On the Agent Management page, locate the created agent and click Download in the Operation column.

                                        Figure 4 Downloading an agent
                                        -

                                      2. Upload the downloaded agent package to the target Linux server.

                                        The Linux server has no special requirements for vCPUs, memory, and disks, but must meet the following requirements:

                                        -
                                        • Java 8 (64-bit) has been installed and Java environment variables have been configured.
                                        • User Ruby must be granted the write permission of the /tmp directory. If there is no user Ruby, create one.
                                        -
                                        -

                                      3. Decompress the package and run the following command to install the agent:

                                        sh sbin/install.sh

                                        -

                                      4. If you want to use the agent to connect to a relational database, you need to upload the corresponding drivers (see Managing Drivers) to the /server/jdbc directory in the agent installation directory and modify the version number of the corresponding database driver in the properties file in the same directory.
                                      5. Run the following command as user root to change the owner and group of the driver uploaded to the /server/jdbc directory to Ruby:

                                        chown Ruby.Ruby * -R

                                        -

                                      6. After the installation is complete, run the following commands to start the agent:

                                        su Ruby

                                        -

                                        sh sbin/start.sh

                                        -

                                      7. Run the following command to check whether the agent is started:

                                        ps -ef | grep cdm

                                        -

                                        If the command output contains the running agent process, the agent process has been started.

                                        -

                                      -
                                      -

                                      Connecting to an Agent

                                      1. On the Agent Management page, locate the created agent and click Connect in the Operation column.

                                        Figure 5 Connecting to an agent
                                        -

                                      2. After the agent is successfully connected, you can select it when creating a connection.
                                      -
                                      -
                                      -
                                      - -
                                      - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0130.html b/docs/dataartsstudio/umn/dataartsstudio_01_0130.html index a06dd2942..716d85050 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0130.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0130.html @@ -3,10 +3,10 @@

                                      Creating an MRS Hive Link

                                      MRS Hive links are applicable to the MapReduce Service (MRS). This tutorial describes how to create an MRS Hive link.

                                      -

                                      Prerequisites

                                      • You have created a CDM cluster.
                                      • You have obtained the Manager IP address, and administrator account and password of the MRS cluster, and the account has the permissions to import and export data.
                                      • The MRS cluster and the CDM cluster can communicate with each other. The following requirements must be met for network interconnection:
                                        • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, the host where the data source is located can access the Internet, and the port has been enabled in the firewall rules.
                                        • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                        • The cloud service instance and the CDM cluster belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                        +

                                        Prerequisites

                                        • You have created a CDM cluster.
                                        • You have obtained the Manager IP address, and administrator account and password of the MRS cluster, and the account has the permissions to import and export data.
                                        • The MRS cluster and the CDM cluster can communicate with each other. The following requirements must be met for network interconnection:
                                          • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, the host where the data source is located can access the Internet, and the port has been enabled in the firewall rules.
                                          • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                          • The cloud service instance and the CDM cluster belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                        -

                                        Creating an MRS Hive Link

                                        1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.

                                          Figure 1 Selecting a connector type
                                          +

                                          Creating an MRS Hive Link

                                          1. On the Cluster Management page, locate a cluster and click Job Management in the Operation column. On the displayed page, click the Links tab and then Create Link.

                                            Figure 1 Selecting a connector type

                                          2. Select MRS Hive and click Next to configure parameters for the MRS Hive link.
                                          3. Click Show Advanced Attributes to view more optional parameters. Retain their default values. The following table lists the mandatory parameters.

                                            @@ -25,7 +25,9 @@ - @@ -72,7 +74,7 @@ - - - @@ -63,7 +63,7 @@ - @@ -78,23 +78,40 @@
                                          4. If the data source is MySQL, PostgreSQL, or DM, you can obtain the access address from the database administrator.
                                          5. + + + + - - + + + + @@ -103,7 +120,14 @@ + + + + @@ -136,7 +160,7 @@
                                            Table 1 MRS Hive link parameters

                                            Parameter

                                            Manager IP

                                            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.

                                            +
                                            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            +
                                            +

                                            127.0.0.1

                                            ldapUsername

                                            This parameter is mandatory when Enable ldap is enabled.

                                            +

                                            This parameter is mandatory when Enable ldap is enabled.

                                            Enter the username configured when LDAP authentication was enabled for MRS Hive.

                                            -

                                            @@ -80,7 +82,7 @@

                                            ldapPassword

                                            This parameter is mandatory when Enable ldap is enabled.

                                            +

                                            This parameter is mandatory when Enable ldap is enabled.

                                            Enter the password configured when LDAP authentication was enabled for MRS Hive.

                                            -

                                            @@ -97,7 +99,7 @@

                                            This parameter is mandatory when OBS storage support is enabled. The account corresponding to the AK/SK pair must have the OBS Buckets Viewer permission. Otherwise, OBS cannot be accessed and the "403 AccessDenied" error is reported.

                                            You need to create an access key for the current account and obtain an AK/SK pair.

                                            -
                                            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 2.
                                              Figure 2 Clicking Create Access Key
                                              +
                                              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 2.
                                                Figure 2 Clicking Create Access Key
                                              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                                                NOTE:
                                                • Only two access keys can be added for each user.
                                                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                                              @@ -156,3 +158,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0131.html b/docs/dataartsstudio/umn/dataartsstudio_01_0131.html index 1f086f7fd..6a81b96aa 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0131.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0131.html @@ -6,8 +6,8 @@

                                              Creating a MySQL Link

                                              1. Access the CDM console, choose Cluster Management in the navigation pane, locate the target cluster, and choose Job Management > Link Management > Driver Management. The Driver Management page is displayed.
                                              2. On the Driver Management page, click the document link in the Recommended Version column of the MySQL driver and obtain the driver file as instructed.
                                              3. On the Driver Management page, upload the MySQL driver using either of the following methods:

                                                Click Upload in the Operation column and select a local driver.

                                                Alternatively, click Copy from SFTP in the Operation column and configure the SFTP Link name and Driver File Path.

                                                -

                                              4. On the Cluster Management page, click Job Management of the cluster and choose Links > Create Link to enter the page for selecting the connector.

                                                Figure 1 Selecting a connector type
                                                -

                                              5. Select MySQL and click Next to configure parameters for the MySQL link.

                                                +

                                              6. On the Cluster Management page, click Job Management of the cluster and choose Links > Create Link to enter the page for selecting the connector.

                                                Figure 1 Selecting a connector type
                                                +

                                              7. Select MySQL and click Next to configure parameters for the MySQL link.

                                                - - - @@ -102,7 +102,8 @@ - @@ -142,3 +143,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0132.html b/docs/dataartsstudio/umn/dataartsstudio_01_0132.html index 0c63efdc9..ac84a00f4 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0132.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0132.html @@ -1,9 +1,9 @@ -

                                                Managing Drivers

                                                +

                                                Uploading a CDM Link Driver

                                                The Java Database Connectivity (JDBC) provides programmatic access to relational databases. Applications can execute SQL statements and retrieve data using the JDBC API.

                                                Before connecting CDM to a relational database, you need to upload the JDK 8 .jar driver of the relational database.

                                                -

                                                Prerequisites

                                                • A cluster has been created.
                                                • You have downloaded one of the drivers listed in Table 1.
                                                • (Optional) An SFTP link has been created by referring to Link to an FTP or SFTP Server and the corresponding driver has been uploaded to the offline file server.
                                                +

                                                Prerequisites

                                                • A cluster has been created.
                                                • You have downloaded one of the drivers listed in Table 1.
                                                • (Optional) An SFTP link has been created by referring to FTP/SFTP Link Parameters and the corresponding driver has been uploaded to the offline file server.

                                                How Do I Obtain a Driver?

                                                Select a driver version that adapts to the database type. Note that the version of the uploaded driver does not need to match the version of the database to be connected. Obtain the JDK8 .jar driver of the recommended version by referring to Table 1.

                                                @@ -58,27 +58,19 @@
                                                - - - - - - - - @@ -89,14 +81,21 @@
                                                Table 1 MySQL link parameters

                                                Parameter

                                                Description

                                                @@ -67,9 +67,9 @@

                                                Use Agent

                                                Whether to extract data from the data source through an agent

                                                +

                                                The agent function will be unavailable soon and does not need to be configured.

                                                Yes

                                                +

                                                -

                                                local_infile Character Set

                                                @@ -88,7 +88,7 @@

                                                Agent

                                                Click Select and select the created agent.

                                                +

                                                The agent function will be unavailable soon and does not need to be configured.

                                                -

                                                Commit Size

                                                Obtaining data from the source through the agent

                                                +

                                                (Optional) Displayed when you click Show Advanced Attributes.

                                                +

                                                Number of records submitted each time. Set this parameter based on the destination and data size of the job. If the value is too large or too small, the job execution time may be affected.

                                                1000

                                                sqljdbc42.jar

                                                DM

                                                +

                                                Dameng database

                                                DM

                                                Obtain DmJdbcDriver18.jar from the DM installation directory /dmdbms/drivers/jdbc.

                                                +

                                                https://eco.dameng.com/download/

                                                +

                                                Obtain DmJdbcDriver18.jar from the DM installation directory /dmdbms/drivers/jdbc.

                                                DmJdbcDriver18.jar

                                                Doris

                                                -

                                                MYSQL

                                                -

                                                https://downloads.mysql.com/archives/c-j/

                                                -

                                                mysql-connector-java-5.1.48.jar

                                                -

                                                POSTGRESQL_KINGBASE

                                                KINGBASE

                                                +

                                                POSTGRESQL_KINGBASE

                                                https://www.kingbase.com.cn/rjcxxz/index.htm

                                              -

                                              Procedure

                                              1. Access the CDM console, choose Cluster Management in the navigation pane, locate the target cluster, and choose Job Management > Link Management > Driver Management. On the Driver Management page, upload a driver.

                                                Figure 1 Uploading a driver
                                                +

                                                Procedure

                                                1. Access the CDM console, choose Cluster Management in the navigation pane, locate the target cluster, and choose Job Management > Link Management > Driver Management. On the Driver Management page, upload a driver.

                                                  Figure 1 Uploading a driver

                                                2. Click Upload in the Operation column and select a local driver.

                                                  Alternatively, click Copy from SFTP in the Operation column and configure the SFTP Link name and Driver File Path.

                                                3. (Optional) If you have uploaded an updated version of a driver, you must restart the CDM cluster for the new driver to take effect.
                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0133.html b/docs/dataartsstudio/umn/dataartsstudio_01_0133.html index ea5ceb385..a6e1bd053 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0133.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0133.html @@ -12,7 +12,7 @@

                                            -

                                            Creating an Oracle Link

                                            1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.
                                            2. Select Oracle and click Next to configure parameters for the link.

                                              Figure 1 Creating an Oracle link
                                              +

                                              Creating an Oracle Link

                                              1. Click Job Management in the Operation column of the CDM cluster. On the displayed page, click the Links tab and then Create Link. The Select Connector page is displayed.
                                              2. Select Oracle and click Next to configure parameters for the link.

                                                Figure 1 Creating an Oracle link
                                                @@ -73,14 +73,14 @@ - - - @@ -178,14 +178,14 @@ - - - @@ -202,12 +202,12 @@

                                              3. Click Save.
                                              4. -

                                                Creating a Migration Job

                                                1. Choose Table/File Migration > Create Job to create a job for exporting data from the Oracle database to DWS.

                                                  Figure 2 Creating a job for migrating data from Oracle to DWS
                                                  +

                                                  Creating a Migration Job

                                                  1. Choose Table/File Migration > Create Job to create a job for exporting data from the Oracle database to DWS.

                                                    Figure 2 Creating a job for migrating data from Oracle to DWS
                                                    • Job Name: Enter a unique name.
                                                    • Source Job Configuration
                                                      • Source Link Name: Select the oracle_link created in Creating an Oracle Link.
                                                      • Schema/Tablespace: Enter the name of the database whose data is to be migrated.
                                                      • Table Name: Enter the name of the table whose data is to be migrated.
                                                      • Retain the default values of the optional parameters in Show Advanced Attributes.
                                                    • Destination Job Configuration
                                                      • Destination Link Name: Select the dwslink created in Creating a DWS Link.
                                                      • Schema/Tablespace: Select the DWS database to which data is to be written.
                                                      • Auto Table Creation: This parameter is displayed only when both the migration source and destination are relational databases.
                                                      • Table Name: Name of the table to which data is to be written. You can enter a table name that does not exist. CDM automatically creates the table in DWS.
                                                      • Orientation: You can create row- or column-store tables as needed. Generally, if a table contains many columns (called a wide table) and its query involves only a few columns, column storage is recommended. If a table contains only a few columns and a query includes most of the fields, row storage is recommended.
                                                      • Extend char length: If the data encoding formats of the migration source and destination are different, the character length of the automatic table creation may be insufficient. If you select Yes for this parameter, the character length will be increased by three times during automatic table creation.
                                                      • Clear Data Before Import: whether to clear data in the destination table before the migration task starts.

                                                  2. Click Next. The Map Field page is displayed. CDM automatically matches the source and destination fields, as shown in Figure 3.

                                                    • If the field mapping is incorrect, you can drag the fields to adjust the mapping.
                                                    • The expressions in CDM support field conversion of common character strings, dates, and values.
                                                    -
                                                    Figure 3 Table-to-table field mapping
                                                    +
                                                    Figure 3 Table-to-table field mapping

                                                  3. Click Next and set task parameters. Generally, retain the default values of all parameters.

                                                    In this step, you can configure the following optional functions:
                                                    • Retry Upon Failure: If the job fails to be executed, you can determine whether to automatically retry. Retain the default value Never.
                                                    • Group: Select the group to which the job belongs. The default group is DEFAULT. On the Job Management page, jobs can be displayed, started, or exported by group.
                                                    • Schedule Execution: Enable it if you need to configure scheduled jobs. Retain the default value No.
                                                    • Concurrent Extractors: Enter the number of extractors to be concurrently executed. You can increase the value of this parameter to improve migration efficiency.
                                                    • Write Dirty Data: Dirty data may be generated during data migration between tables. You are advised to select Yes.
                                                    • Delete Job After Completion: Retain the default value Do not delete.

                                                  4. Click Save and Run. The Job Management page is displayed, on which you can view the job execution progress and result.
                                                  5. After the job is successfully executed, in the Operation column of the job, click Historical Record to view the job's historical execution records and read/write statistics.

                                                    On the Historical Record page, click Log to view the job logs.

                                                    @@ -222,3 +222,10 @@
                                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0011.html b/docs/dataartsstudio/umn/dataartsstudio_01_0134.html similarity index 50% rename from docs/dataartsstudio/umn/dataartsstudio_01_0011.html rename to docs/dataartsstudio/umn/dataartsstudio_01_0134.html index 9712af4be..6624b1600 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0011.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0134.html @@ -1,17 +1,17 @@ - + -

                                                Managing a Workspace

                                                -
                                                +

                                                Creating and Configuring a Workspace in Simple Mode

                                                +
                                                diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0136.html b/docs/dataartsstudio/umn/dataartsstudio_01_0136.html deleted file mode 100644 index b8927dffe..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0136.html +++ /dev/null @@ -1,79 +0,0 @@ - - -

                                                From Doris

                                                -

                                                If the source link of a job is a Doris link, configure the source job parameters based on Table 1.

                                                - -
                                                Table 1 Oracle link parameters

                                                Parameter

                                                Use Agent

                                                Whether to extract data from the data source through an agent

                                                +

                                                The agent function will be unavailable soon and does not need to be configured.

                                                Yes

                                                +

                                                -

                                                Agent

                                                Click Select and select the created agent.

                                                +

                                                The agent function will be unavailable soon and does not need to be configured.

                                                -

                                                Use Agent

                                                Whether to extract data from the data source through an agent

                                                +

                                                The agent function will be unavailable soon and does not need to be configured.

                                                Yes

                                                +

                                                -

                                                Agent

                                                Click Select and select the created agent.

                                                +

                                                The agent function will be unavailable soon and does not need to be configured.

                                                -

                                                - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                                Table 1 Parameter description

                                                Type

                                                -

                                                Parameter

                                                -

                                                Description

                                                -

                                                Example Value

                                                -

                                                Basic parameters

                                                -

                                                Use SQL Statement

                                                -

                                                Whether to use SQL statements to extract source data

                                                -

                                                No

                                                -

                                                Schema/Tablespace

                                                -

                                                Name of the database to which data will be written. The schema can be automatically created. Click the icon next to the text box to select a schema or tablespace.

                                                -

                                                schema

                                                -

                                                Table Name

                                                -

                                                Name of the table from which data will be read. Click the button next to the text box. The dialog box for selecting the table is displayed.

                                                -

                                                This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Factory of DataArts Studio, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                -
                                                -

                                                table

                                                -

                                                Where Clause

                                                -

                                                If you set Use SQL Statement to No, you can add a where clause to add filter criteria.

                                                -

                                                age > 18 and age <= 60

                                                -

                                                Partition Column

                                                -

                                                Column used to split data during data extraction to implement parallel extraction

                                                -

                                                id

                                                -

                                                Null in Partition Column

                                                -

                                                During concurrent extraction, if the partition column does not contain null, set this parameter to No to improve performance. If you are not sure whether the partition column contains null, set this parameter to Yes to avoid data loss.

                                                -

                                                No

                                                -

                                                Regain Symbol (in OBT)

                                                -

                                                Field as the resumable transfer flag. The source field is an incremental value or timestamp, and the destination field is of the same type as the source field.

                                                -

                                                id

                                                -
                                                -
                                                -
                                              -
                                              - -
                                              - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0137.html b/docs/dataartsstudio/umn/dataartsstudio_01_0137.html new file mode 100644 index 000000000..7b3375213 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0137.html @@ -0,0 +1,19 @@ + + +

                                              HBase/CloudTable Incremental Migration

                                              +

                                              You can use CDM to export data in a specified period of time from HBase (including MRS HBase, FusionInsight HBase, and Apache HBase) and CloudTable. The CDM scheduled jobs can be used together to implement incremental migration of HBase and CloudTable.

                                              +

                                              If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                              +
                                              +

                                              When creating a table/file migration job and selecting the link to HBase or CloudTable as the source link, you can set the time range in advanced attributes.

                                              +
                                              Figure 1 Time range
                                              +
                                              • Start time (including the value) for extracting data. The format is yyyy-MM-dd HH:mm:ss. Only the data generated at the specified time and later is extracted.
                                              • End time (excluding the value) for extracting data. The format is yyyy-MM-dd HH:mm:ss. Only the data generated before the time point is extracted.
                                              +

                                              The two parameters can be set to macro variables of date and time. Examples are as follows:

                                              +
                                              • If Minimum Timestamp is set to ${dateformat(yyyy-MM-dd HH:mm:ss, -1, DAY)}, only the data generated after the day before is exported.
                                              • If Maximum Timestamp is set to ${dateformat(yyyy-MM-dd HH:mm:ss)}, only the data generated before the specified time point is exported.
                                              +

                                              If both parameters are configured, CDM exports only the data generated on the previous day. In addition, if the job is configured to execute at 00:00:00 every day, the data generated every day can be incrementally synchronized.

                                              +
                                              +
                                              + +
                                              + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0138.html b/docs/dataartsstudio/umn/dataartsstudio_01_0138.html new file mode 100644 index 000000000..89f9754c5 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0138.html @@ -0,0 +1,20 @@ + + +

                                              Creating a DataArts Studio Incremental Package

                                              +

                                              +
                                              + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0139.html b/docs/dataartsstudio/umn/dataartsstudio_01_0139.html new file mode 100644 index 000000000..0b1347339 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0139.html @@ -0,0 +1,34 @@ + + +

                                              Introduction to Incremental Packages

                                              +

                                              DataArts Studio provides basic and incremental packages. If the basic package cannot meet your demands, you need to create an incremental package.

                                              +

                                              DataArts Studio Incremental Packages

                                              Table 1 lists the incremental packages provided by DataArts Studio.

                                              + +
                                              + + + + + + + + + +
                                              Table 1 Incremental packages

                                              Package Type

                                              +

                                              Description

                                              +

                                              Scenario

                                              +

                                              DataArts Migration incremental package

                                              +

                                              A DataArts Migration (that is, CDM) incremental package provides resources for a CDM cluster. When you create a CDM incremental package, the system automatically creates a CDM cluster based on the specifications you select for the incremental package.

                                              +
                                              CDM clusters can be used in the following scenarios:
                                              • Data migration jobs can be created and run in CDM clusters to migrate data to the cloud or import data to the data lake.
                                              • CDM clusters can be used as agents of data connections in Management Center, which enable communications between DataArts Studio instances and data sources.
                                              +
                                              +

                                              A DataArts Studio instance does not contain CDM clusters. To use CDM clusters, create DataArts Migration incremental packages.

                                              +
                                              +
                                              +
                                              +
                                              + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0145.html b/docs/dataartsstudio/umn/dataartsstudio_01_0145.html new file mode 100644 index 000000000..4756ddc02 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0145.html @@ -0,0 +1,88 @@ + + +

                                              Creating a DataArts Migration Resource Group Incremental Package

                                              +

                                              This type of incremental package provides resource groups for real-time jobs in DataArts Migration. DataArts Migration resource groups can be used to migrate data to the cloud and ingest data into and export data out of a data lake. It provides wizard-based configuration and management and can migrate all and incremental data from a single table, entire database, or database or table shard.

                                              +

                                              DataArts Migration resource groups can be used in the following scenarios:

                                              +

                                              They can be used to create and run real-time processing migration jobs to migrate data to the cloud or ingest data into the data lake.

                                              +

                                              By default, a DataArts Studio instance does not contain DataArts Migration resource groups. If you want to migrate data in real time, create a DataArts Migration resource group incremental package.

                                              +

                                              Context

                                              • When you create a DataArts Migration resource group incremental package, the system automatically creates a resource group required by real-time data integration jobs based on the specifications you set for the incremental package.
                                              • When buying a DataArts Migration resource group incremental package (pay-per-use resource package), pay attention to the following:
                                                • When you buy a DataArts Migration resource group incremental package which is billed based on a pay-per-use package, the system does not automatically create a resource group for real-time processing migration jobs. Instead, you can use a resource group you have obtained on the DataArts Studio console for 745 hours each month within the validity period of the incremental package and in a specified region.
                                                • If you have one or more resource groups in a region, the duration quota of your resource package will be deducted first. Any usage beyond the quota will be billed in pay-per-use mode. (If a resource package is shared by multiple clusters, the available package duration may be insufficient in each subscription period.)

                                                  For example, if you purchase a one-month package (745 hours/month) and two resources are associated with the package, 372.5 hours (about 15.5 days) can be allocated to each resource group within the one-month subscription. Any usage beyond the allocated hours will be billed in pay-per-use mode.

                                                  +
                                                • If you purchase a package and do not associate it with any resource group, the duration quota in the package will not be consumed and the validity period of the package will not be extended as well. Therefore, you are advised to make a plan before buying a package.
                                                • If you want to enjoy the preferential price of the yearly/monthly incremental package, you can buy a yearly/monthly incremental package and then buy a pay-per-use incremental package which is in the same region and has the same specifications as the yearly/monthly incremental package.
                                                • If you buy a pay-per-use incremental package and then a yearly/monthly incremental package in the same region and with the same specifications as the pay-per-use incremental package, the fees generated before you buy the yearly/monthly incremental package are charged in pay-per-use mode, and the subsequent fees are charged based on the yearly/monthly incremental package.
                                                + +
                                              • You can locate a DataArts Studio instance, click More, and select View Packages to view your incremental packages.
                                              • The prices of resource groups vary depending on their specifications. For details, see . You can also access the of DataArts Studio and select a region and specifications to quickly obtain the price of a resource group.
                                              +
                                              +

                                              Creating a DataArts Migration Resource Group

                                              1. You can buy a resource group in either of the following ways:
                                                • Method 1

                                                  Locate an enabled instance and click Create.

                                                  +
                                                  Figure 1 Incremental package
                                                  +
                                                • Method 2
                                                  1. Locate an instance and click Access.
                                                  2. In the upper right corner, click Buy.
                                                  +
                                                • Method 3
                                                  1. Locate an instance, click More, and select Resources.
                                                    Figure 2 Accessing Resources
                                                    +
                                                  2. On the Real-Time Resources tab page, click Buy Resource Group.
                                                    Figure 3 Buying a resource group
                                                    +
                                                  +
                                                +
                                              1. On the displayed page, set parameters based on Table 1.
                                                Figure 4 Creating a DataArts Migration resource group
                                                + +
                                                + + + + + + + + + + + + + + + + + + + + + + +
                                                Table 1 Parameters for the DataArts Migration resource group incremental package

                                                Parameter

                                                +

                                                Description

                                                +

                                                Package

                                                +

                                                DataArts Migration resource group

                                                +

                                                Name

                                                +

                                                Enter the resource group name.

                                                +

                                                Description

                                                +

                                                Enter a description for the DataArts Migration resource group.

                                                +

                                                Specifications

                                                +

                                                Select the specifications for the resource group, including the CU value, applicable environment, and maximum number of jobs that can be created.

                                                +

                                                The maximum number of migration tasks or jobs that can be created varies depending on the resource group specifications. Select the specifications that suit your needs. A maximum of 50 tables can be created for a single job (at least 2 CUs are required).

                                                +

                                                Small: 16 CUs and a maximum of 7 jobs This option is applicable to tests and does not support high availability. It is not recommended.

                                                +

                                                Medium: 64 CUs and a maximum of 32 jobs

                                                +

                                                Large: 96 CUs and a maximum of 48 jobs

                                                +

                                                Super-large: 128 CUs and a maximum of 64 jobs

                                                +

                                                Network Segment

                                                +

                                                Recommended network segments:

                                                +
                                                • 10.0.0.0–10.255.0.0/8–19
                                                • 172.16.0.0–172.31.0.0/12–19
                                                • 192.168.0.0~192.168.0.0/16 ~19
                                                  NOTE:
                                                  • To use VPC peering connections, set a network segment that does not overlap with that of the source and destination cluster or instance. If they overlap, the network will be disconnected.
                                                  • Restricted by the CCE logic, the maximum length of the network segment mask is 19 bits. Network segments with a mask longer than 20 bits are not supported.
                                                  +
                                                  +
                                                +

                                                Discount Quota (Hour)

                                                +

                                                A discount package is prepaid by month or year. Compared with pay-per-use billing, the fee is reduced by 15% to 29%.

                                                +
                                                +
                                                +
                                                • You cannot modify the specifications of an existing resource group. If you need higher specifications, create another resource group.
                                                • A pay-per-use resource package in use cannot be unsubscribed from. For details, see .
                                                +
                                                +
                                              2. Click Create Now, confirm the settings, and click Next. If the resource group fails to be created and a quota issue is displayed, contact the service personnel to apply for a quota.
                                              3. Go to the corresponding workspace to view the DataArts Migration resource group you have created.
                                              +
                                              +
                                              1. On the displayed page, set the following parameters:
                                                1. Select DataArts Migration resource group for Package.
                                                2. Select Pay-per-Use Package for Billing Mode.
                                                3. Specify a validity period in Required Duration for the package.
                                                4. Enter the number of subscribed packages in Quantity. For example, if you set Required Duration to 1 month and Quantity to 2, you will have a 1,490-hour quota in one month.
                                                +
                                              2. Click Buy Now, confirm the specifications, and click Next.
                                              3. After you buy this package, the system will not automatically create a DataArts Migration resource group. You need to buy a pay-per-use incremental package in the same region and with the same specifications as this package by following the instructions in Creating a DataArts Migration Resource Group. Then you can enjoy the favorable price of this package.
                                              +
                                              + + + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0157.html b/docs/dataartsstudio/umn/dataartsstudio_01_0157.html new file mode 100644 index 000000000..5725a13ae --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0157.html @@ -0,0 +1,71 @@ + + + +

                                              Configuring Link Parameters

                                              + +

                                              +
                                              + +
                                              + + + +
                                              + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0184.html b/docs/dataartsstudio/umn/dataartsstudio_01_0184.html index 6abd70024..603e33c48 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0184.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0184.html @@ -1,6 +1,6 @@ -

                                              Link to MRS Hudi

                                              +

                                              MRS Hudi Link Parameters

                                              Table 1 describes the MRS Hudi link parameters.

                                              Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                              @@ -22,7 +22,7 @@

                                            Manager IP

                                            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            +
                                            Floating IP address of MRS Manager. Click Select next to the Manager IP text box to select an MRS cluster. CDM automatically fills in the authentication information.
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            This parameter is available when OBS storage support is set to Yes.

                                            AK and SK are used to log in to the OBS server.

                                            You need to create an access key for the current account and obtain an AK/SK pair.

                                            -
                                            To obtain an access key, perform the following steps:
                                            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                                              Figure 1 Clicking Create Access Key
                                              +
                                              To obtain an access key, perform the following steps:
                                              1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                              2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                                                Figure 1 Clicking Create Access Key
                                              3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                                                NOTE:
                                                • Only two access keys can be added for each user.
                                                • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                                              @@ -100,7 +100,14 @@
                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0185.html b/docs/dataartsstudio/umn/dataartsstudio_01_0185.html index e75b32c64..1094ab98f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0185.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0185.html @@ -33,7 +33,7 @@

                                            Hudi table name. Click the icon next to the text box. The dialog box for selecting the table is displayed.

                                            You can set a macro variable of date and time, and a path name can contain multiple macro variables. You can use macro variables of date and time in a scheduled job to synchronize incremental data periodically. For details, see Using Macro Variables of Date and Time.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            TBL_E

                                            @@ -45,7 +45,7 @@

                                            This parameter indicates the where clause to be extracted. If this parameter is not set, the entire table is extracted. If the table to be migrated does not contain the fields specified by the where clause, the migration will fail.

                                            You can set a macro variable of date and time to extract the data generated on a specific date. For details, see Incremental Migration of Relational Databases.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            age > 18 and age <= 60

                                            @@ -57,7 +57,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0186.html b/docs/dataartsstudio/umn/dataartsstudio_01_0186.html index a92b149c4..44ef201a9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0186.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0186.html @@ -3,19 +3,19 @@

                                            To MRS Hudi

                                            If the destination link of a job is an MRS Hudi link, configure the destination job parameters based on Table 1.

                                            -
                                            - - - @@ -326,7 +326,7 @@ - @@ -372,7 +372,7 @@ - @@ -396,7 +396,7 @@ - @@ -407,7 +407,7 @@ - @@ -835,7 +835,7 @@ - @@ -1062,7 +1062,7 @@ - @@ -1358,7 +1358,7 @@ - @@ -1369,7 +1369,7 @@ - @@ -1467,7 +1467,7 @@ - - - - @@ -1758,7 +1757,7 @@ - - - @@ -102,15 +105,17 @@ - - @@ -135,9 +140,9 @@
                                            Table 1 Parameter description

                                            Category

                                            +
                                            - - - - - - - @@ -179,7 +179,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0196.html b/docs/dataartsstudio/umn/dataartsstudio_01_0196.html index b49f57835..5ab08ec69 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0196.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0196.html @@ -1,7 +1,7 @@

                                            Supported Data Sources (2.10.0.300)

                                            -
                                            CDM provides the following migration modes which support different data sources: +
                                            CDM provides the following migration modes which support different data sources:

                                            This section describes the data sources supported by CDM clusters of version 2.10.0.300. The supported data sources vary depending on the CDM cluster version.

                                            @@ -18,27 +18,28 @@
                                            - - - - @@ -46,20 +47,20 @@ - - - @@ -68,7 +69,7 @@ - - - - - - - - - - - - @@ -135,89 +120,54 @@ - - - - - - - - - - - - - - - - + - - - - - - - - - - - - - - - - - - - - - - - - @@ -238,23 +188,111 @@ - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + @@ -290,7 +328,7 @@ - - - - - - - - - - - - @@ -424,25 +441,7 @@ - - - - - - - - - - - @@ -453,22 +452,68 @@ - - - - + - - - - + + + + + + + + + + + + + + + + + + + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0197.html b/docs/dataartsstudio/umn/dataartsstudio_01_0197.html deleted file mode 100644 index 32242c048..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0197.html +++ /dev/null @@ -1,486 +0,0 @@ - - -

                                            Supported Data Sources (2.10.0.100)

                                            -
                                            CDM provides the following migration modes which support different data sources: -
                                            -

                                            This section describes the data sources supported by CDM clusters of version 2.10.0.100. The supported data sources vary depending on the CDM cluster version.

                                            -
                                            -

                                            Data Sources Supported by Table/File Migration

                                            Table/File migration can migrate data in tables or files.

                                            -
                                            Table 1 describes the supported data sources. -
                                            Table 1 Parameter description

                                            Type

                                            Parameter

                                            +

                                            Parameter

                                            Description

                                            +

                                            Description

                                            Example Value

                                            +

                                            Example Value

                                            Basic parameters

                                            +

                                            Basic parameters

                                            Destination Link Name

                                            +

                                            Destination Link Name

                                            MRS Hudi link

                                            @@ -34,7 +34,7 @@

                                            Click the icon next to the text box. The dialog box for selecting the table is displayed.

                                            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. You can use macro variables of date and time in a scheduled job to synchronize incremental data periodically. For details, see Using Macro Variables of Date and Time.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            cdm

                                            @@ -91,9 +91,9 @@

                                            cdc_last_update_date

                                            Hudi Table Creation parameters

                                            +

                                            Hudi table creation parameters

                                            Location

                                            +

                                            Location

                                            OBS or HDFS path where database table files are stored

                                            Data warehouse

                                            +

                                            GaussDB(DWS)

                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable

                                            The DWS physical machine management mode is not supported.

                                            Data Lake Insight (DLI)

                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable and MongoDB
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: MongoDB
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable

                                            Recommended MongoDB version:

                                            -

                                            4.2

                                            +

                                            Recommended MongoDB version: 4.2

                                            +

                                            You must have the SELECT permission (for querying tables) on all fields of the DLI data source.

                                            MRS ClickHouse

                                            Data warehouse: MRS ClickHouse and Data Lake Insight (DLI)

                                            • Recommended MRS ClickHouse version: 21.3.4.X
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                              +
                                            • Recommended MRS ClickHouse version: 21.3.4.X
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            Data warehouses: Doris

                                            -

                                            +

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            Hadoop

                                            +

                                            Hadoop

                                            MRS HDFS

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable
                                            • Supported by local storage. Only MRS Hive and MRS Hudi are supported in storage-compute decoupling scenarios.
                                            • Only MRS Hive is supported in Ranger scenarios.
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended MRS HDFS versions:
                                              • 2.8.X
                                              • 3.1.X
                                            • Recommended MRS HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                            • MRS Hive and MRS Hudi 2.x versions are not supported. The following versions are recommended:
                                              • 1.2.X
                                              • 3.1.X
                                              -
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                              +
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            MRS Hive

                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS), CloudTable, and SAP HANA

                                            MRS Hudi

                                            @@ -76,25 +77,9 @@
                                            • Data warehouse: GaussDB(DWS)
                                            • Hadoop: MRS HBase

                                            FusionInsight HDFS

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • FusionInsight cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended FusionInsight HDFS versions:
                                              • 2.8.X
                                              • 3.1.X
                                              -
                                            • Recommended FusionInsight HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                              -
                                            • Recommended FusionInsight Hive versions:
                                              • 1.2.X
                                              • 3.1.X
                                              -
                                            -

                                            FusionInsight HBase

                                            -

                                            FusionInsight Hive

                                            -

                                            Apache HBase

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable
                                            • Apache cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended Apache HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                            • Apache Hive 2.x versions are not supported. The following versions are recommended:
                                              • 1.2.X
                                              • 3.1.X
                                              @@ -112,7 +97,7 @@

                                            Object Storage Service (OBS)

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable
                                            • Object Storage Migration Service (OMS) is recommended for migration between object storage services.
                                            • Binary files cannot be imported to a database or NoSQL.

                                            @@ -122,7 +107,7 @@

                                            FTP

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            • Object storage: Object Storage Service (OBS)
                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Search: Elasticsearch
                                            • Object storage: Object Storage Service (OBS)
                                            • In OBT: Cloud Search Service (CSS) and CloudTable
                                            • The file system cannot serve as the destination.
                                            • Only text files such as CSV files can be migrated from FTP or SFTP servers to search services. Binary files cannot.
                                            • Only binary files can be migrated from FTP or SFTP servers to OBS.
                                            • obsutil is recommended for migrating data from HTTP servers to OBS.

                                            Hadoop: MRS HDFS

                                            Relational database

                                            +

                                            Relational database

                                            +

                                            RDS for MySQL

                                            +

                                            RDS for MySQL

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), and Doris
                                            • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS), CloudTable, and SAP HANA
                                            • You are advised to use Data Replication Service (DRS) to migrate data between OLTP databases.
                                            • Recommended Microsoft SQL Server version: 2005 or later
                                            +
                                            • You are advised to use Data Replication Service (DRS) to migrate data between OLTP databases.
                                            • Recommended Microsoft SQL Server version: 2005 or later
                                            • Greenplum, Kingbase, and GaussDB can be connected using the PostgreSQL connector. The supported source and destination are the same as those of the PostgreSQL data source.

                                            RDS for SQL Server

                                            +

                                            RDS for SQL Server

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable

                                            RDS for PostgreSQL

                                            +

                                            RDS for PostgreSQL

                                            MySQL

                                            +

                                            MySQL

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS)
                                            • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                            • Object storage: Object Storage Service (OBS)
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable

                                            PostgreSQL

                                            +

                                            PostgreSQL

                                            Oracle

                                            +

                                            Oracle

                                            Microsoft SQL Server

                                            +

                                            Microsoft SQL Server

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable

                                            SAP HANA

                                            +

                                            NoSQL

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS Hive
                                            +

                                            Distributed Cache Service (DCS)

                                            SAP HANA data sources have the following restrictions:
                                            • SAP HANA cannot serve as the destination.
                                            • Only the 2.00.050.00.1592305219 version is supported.
                                            • Only the Generic Edition is supported.
                                            • BW/4 FOR HANA is not supported.
                                            • Only database names, table names, and column names consisting of English letters are supported. Special characters such as spaces and symbols are not allowed.
                                            • The following data types are supported: date, digit, Boolean, and character (except SHORTTEXT). Other data types such as binary are not supported.
                                            • During migration, tables cannot be automatically created at the destination.
                                            -
                                            +
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            +

                                            NoSQL cannot serve as the destination.

                                            +

                                            Database sharding

                                            -
                                            • Data warehouse: Data Lake Insight (DLI)
                                            • Hadoop: MRS HBase and MRS Hive
                                            -
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • Object storage: Object Storage Service (OBS)
                                            -

                                            Database shards cannot serve as the destination.

                                            +

                                            Redis

                                            ShenTong

                                            -
                                            • Hadoop: MRS Hive and MRS Hudi
                                            -

                                            -

                                            -

                                            NoSQL

                                            -

                                            Distributed Cache Service (DCS)

                                            -

                                            Hadoop: MRS HDFS, MRS HBase, and MRS Hive

                                            -

                                            NoSQL except CloudTable cannot serve as the destination.

                                            -

                                            Redis

                                            -

                                            Document Database Service (DDS)

                                            -

                                            MongoDB

                                            -

                                            CloudTable HBase

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            Cassandra

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +

                                            MongoDB

                                            Message system

                                            @@ -226,7 +176,7 @@

                                            Apache Kafka

                                            Search: Cloud Search Service (CSS)

                                            +

                                            In OBT: Cloud Search Service (CSS)

                                            The message system cannot serve as the destination.

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            • MRS Kafka cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios.
                                            • Not supported by Ranger.
                                            • Not supported if SSL is enabled for ZooKeeper.
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                              +
                                            • MRS Kafka cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            Search

                                            +

                                            Search

                                            Elasticsearch

                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch
                                            • In OBT: CloudTable and Cloud Search Service (CSS)

                                            Only the non-security mode is supported.

                                            Cloud Search Service (CSS)

                                            +

                                            In OBT

                                            +

                                            N/A

                                            +

                                            CloudTable HBase

                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • Search: Elasticsearch
                                            • In OBT: CloudTable and Cloud Search Service (CSS)
                                            +

                                            -

                                            +

                                            Cloud Search Service (CSS)

                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch
                                            • In OBT: CloudTable and Cloud Search Service (CSS)
                                            +

                                            N/A

                                            +

                                            SAP HANA

                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS Hive
                                            +
                                            SAP HANA data sources have the following restrictions:
                                            • SAP HANA cannot serve as the destination.
                                            • Only the 2.00.050.00.1592305219 version is supported.
                                            • Only the Generic Edition is supported.
                                            • BW/4 FOR HANA is not supported.
                                            • Only database names, table names, and column names consisting of English letters are supported. Special characters such as spaces and symbols are not allowed.
                                            • The following data types are supported: date, digit, Boolean, and character (except SHORTTEXT). Other data types such as binary are not supported.
                                            • During migration, tables cannot be automatically created at the destination.
                                            +
                                            +

                                            FusionInsight HDFS

                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable
                                            +

                                            +
                                            • FusionInsight cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended FusionInsight HDFS versions:
                                              • 2.8.X
                                              • 3.1.X
                                              +
                                            • Recommended FusionInsight HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                              +
                                            • Recommended FusionInsight Hive versions:
                                              • 1.2.X
                                              • 3.1.X
                                              +
                                            +

                                            FusionInsight HBase

                                            +

                                            FusionInsight Hive

                                            +

                                            Database shard

                                            +
                                            • Data warehouse shard: Data Lake Insight (DLI)
                                            • Hadoop: MRS HBase and MRS Hive
                                            +
                                            • Search: Elasticsearch
                                            +
                                            • Object storage: Object Storage Service (OBS)
                                            • In OBT: Cloud Search Service (CSS)
                                            +

                                            Database shards cannot serve as the destination.

                                            +

                                            Dameng database

                                            +
                                            • Data warehouse: GaussDB(DWS)
                                            • Hadoop: MRS Hive and MRS Hudi
                                            +

                                            -

                                            +

                                            ShenTong

                                            +

                                            Hadoop: MRS Hive and MRS Hudi

                                            +

                                            -

                                            +

                                            Document Database Service (DDS)

                                            +

                                            Hadoop: MRS HDFS, MRS HBase, and MRS Hive

                                            +

                                            -

                                            +

                                            Cassandra

                                            +
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Search: Elasticsearch
                                            • In OBT: Cloud Search Service (CSS) and CloudTable
                                            +

                                            -

                                            +

                                            GBASE8S

                                            +
                                            • Hadoop: MRS HDFS and MRS HBase
                                            • Message system: MRS Kafka
                                            +

                                            -

                                            +

                                            GBASE8A

                                            +
                                            • Hadoop: MRS HDFS, MRS Hive, and MRS HBase
                                            • Message system: MRS Kafka
                                            +

                                            -

                                            -

                                            Hadoop

                                            +

                                            Hadoop

                                            (available only for local storage, and not for storage-compute decoupling, Ranger, or ZooKeeper for which SSL is enabled)

                                            MRS HBase

                                            @@ -302,7 +340,7 @@

                                            Entire DB migration only to MRS HBase

                                            Recommended versions:
                                            • 2.1.X
                                            • 1.3.X
                                            -

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            +

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            MRS Hive

                                            @@ -314,28 +352,7 @@

                                            Entire DB migration only to a relational database

                                            2.x versions are not supported. The following versions are recommended:
                                            • 1.2.X
                                            • 3.1.X
                                            -

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            -

                                            FusionInsight HBase

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -
                                            Recommended versions:
                                            • 2.1.X
                                            • 1.3.X
                                            -
                                            -

                                            FusionInsight Hive

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Entire DB migration only to a relational database

                                            -
                                            2.x versions are not supported. The following versions are recommended:
                                            • 1.2.X
                                            • 3.1.X
                                            -
                                            +

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            Apache HBase

                                            @@ -368,10 +385,10 @@

                                            Supported only by local storage and in storage-compute decoupling scenarios

                                            2.x versions are not supported. The following versions are recommended:

                                            • 1.2.X
                                            • 3.1.X
                                            -

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            +

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            Relational database

                                            +

                                            Relational database

                                            RDS for MySQL

                                            Not supported

                                            SAP HANA

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -
                                            • Only the 2.00.050.00.1592305219 version is supported.
                                            • Only the Generic Edition is supported.
                                            • BW/4 FOR HANA is not supported.
                                            • Only database names, table names, and column names consisting of English letters are supported. Special characters such as spaces and symbols are not allowed.
                                            • The following data types are supported: date, digit, Boolean, and character (except SHORTTEXT). Other data types such as binary are not supported.
                                            • During migration, tables cannot be automatically created at the destination.
                                            -

                                            Dameng database

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Only to DWS and Hive

                                            -

                                            NoSQL

                                            +

                                            NoSQL

                                            Distributed Cache Service (DCS)

                                            Only migration from MRS to DCS is supported.

                                            Document Database Service (DDS)

                                            +

                                            In OBT

                                            +

                                            +

                                            +

                                            +

                                            +

                                            Supported

                                            +

                                            CloudTable

                                            Supported

                                            +

                                            Supported

                                            Only migration between DDS and MRS is supported.

                                            +

                                            Supported

                                            +

                                            -

                                            CloudTable

                                            +

                                            FusionInsight HBase

                                            Supported

                                            +

                                            Supported

                                            Supported

                                            +

                                            Not supported

                                            -

                                            +
                                            Recommended versions:
                                            • 2.1.X
                                            • 1.3.X
                                            +
                                            +

                                            FusionInsight Hive

                                            +

                                            Supported

                                            +

                                            Not supported

                                            +

                                            Entire DB migration only to a relational database

                                            +
                                            2.x versions are not supported. The following versions are recommended:
                                            • 1.2.X
                                            • 3.1.X
                                            +
                                            +

                                            SAP HANA

                                            +

                                            Supported

                                            +

                                            Not supported

                                            +
                                            • Only the 2.00.050.00.1592305219 version is supported.
                                            • Only the Generic Edition is supported.
                                            • BW/4 FOR HANA is not supported.
                                            • Only database names, table names, and column names consisting of English letters are supported. Special characters such as spaces and symbols are not allowed.
                                            • The following data types are supported: date, digit, Boolean, and character (except SHORTTEXT). Other data types such as binary are not supported.
                                            • During migration, tables cannot be automatically created at the destination.
                                            +

                                            Dameng database

                                            +

                                            Supported

                                            +

                                            Not supported

                                            +

                                            Only to DWS and Hive

                                            +

                                            Document Database Service (DDS)

                                            +

                                            Supported

                                            +

                                            Supported

                                            +

                                            Only migration between DDS and MRS is supported.

                                            - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                            Table 1 Supported data sources during table/file migration

                                            Category

                                            -

                                            Source

                                            -

                                            Destination

                                            -

                                            Description

                                            -

                                            Data warehouse

                                            -

                                            -

                                            GaussDB(DWS)

                                            -
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            The DWS physical machine management mode is not supported.

                                            -

                                            Data Lake Insight (DLI)

                                            -
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), Doris, and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable and MongoDB
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            Recommended MongoDB version:

                                            -

                                            4.2

                                            -

                                            MRS ClickHouse

                                            -

                                            Data warehouse: MRS ClickHouse and Data Lake Insight (DLI)

                                            -
                                            • Recommended MRS ClickHouse version: 21.3.4.X
                                            -
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                              -
                                            -

                                            Doris

                                            -

                                            Data warehouses: Doris

                                            -

                                            -

                                            -

                                            Hadoop

                                            -

                                            -

                                            MRS HDFS

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • Supported by local storage. Only MRS Hive and MRS Hudi are supported in storage-compute decoupling scenarios.
                                            • Only MRS Hive is supported in Ranger scenarios.
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended MRS HDFS versions:
                                              • 2.8.X
                                              • 3.1.X
                                              -
                                            • Recommended MRS HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                              -
                                            • MRS Hive and MRS Hudi 2.X versions are not supported. The following versions are recommended:
                                              • 1.2.X
                                              • 3.1.X
                                              -
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                              -
                                            -

                                            MRS HBase

                                            -

                                            MRS Hive

                                            -
                                            • Data warehouse: GaussDB(DWS), Data Lake Insight (DLI), and MRS ClickHouse
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            MRS Hudi

                                            -
                                            • Data warehouse: GaussDB(DWS)
                                            • Hadoop: MRS HBase
                                            -

                                            FusionInsight HDFS

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • FusionInsight cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended FusionInsight HDFS versions:
                                              • 2.8.X
                                              • 3.1.X
                                              -
                                            • Recommended FusionInsight HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                              -
                                            • Recommended FusionInsight Hive versions:
                                              • 1.2.X
                                              • 3.1.X
                                              -
                                            -

                                            FusionInsight HBase

                                            -

                                            FusionInsight Hive

                                            -

                                            Apache HBase

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • Apache cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper
                                            • Recommended Apache HBase versions:
                                              • 2.1.X
                                              • 1.3.X
                                              -
                                            • Apache Hive 2.X versions are not supported. The following versions are recommended:
                                              • 1.2.X
                                              • 3.1.X
                                              -
                                            • Recommended Apache HDFS versions:
                                              • 2.8.X
                                              • 3.1.X
                                              -
                                            -

                                            Apache Hive

                                            -

                                            Apache HDFS

                                            -

                                            Object storage

                                            -

                                            Object Storage Service (OBS)

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • Object Storage Migration Service (OMS) is recommended for migration between object storage services.
                                            • Binary files cannot be imported to a database or NoSQL.
                                            -

                                            -

                                            File system

                                            -

                                            FTP

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            • Object storage: Object Storage Service (OBS)
                                            -
                                            • The file system cannot serve as the destination.
                                            • Only text files such as CSV files can be migrated from FTP or SFTP servers to search services. Binary files cannot.
                                            • Only binary files can be migrated from FTP or SFTP servers to OBS.
                                            • obsutil is recommended for migrating data from HTTP servers to OBS.
                                            -

                                            SFTP

                                            -

                                            HTTP

                                            -

                                            Hadoop: MRS HDFS

                                            -

                                            Relational database

                                            -

                                            RDS for MySQL

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • You are advised to use Data Replication Service (DRS) to migrate data between OLTP databases.
                                            • Recommended Microsoft SQL Server version: 2005 or later
                                            -

                                            RDS for SQL Server

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            RDS for PostgreSQL

                                            -

                                            MySQL

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            PostgreSQL

                                            -

                                            Oracle

                                            -

                                            Microsoft SQL Server

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            SAP HANA

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS Hive
                                            -
                                            SAP HANA data sources have the following restrictions:
                                            • SAP HANA cannot serve as the destination.
                                            • Only the 2.00.050.00.1592305219 version is supported.
                                            • Only the Generic Edition is supported.
                                            • BW/4 FOR HANA is not supported.
                                            • Only database names, table names, and column names consisting of English letters are supported. Special characters such as spaces and symbols are not allowed.
                                            • The following data types are supported: date, digit, Boolean, and character (except SHORTTEXT). Other data types such as binary are not supported.
                                            • During migration, tables cannot be automatically created at the destination.
                                            -
                                            -

                                            Database sharding

                                            -
                                            • Data warehouse: Data Lake Insight (DLI)
                                            • Hadoop: MRS HBase and MRS Hive
                                            -
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • Object storage: Object Storage Service (OBS)
                                            -

                                            Database shards cannot serve as the destination.

                                            -

                                            ShenTong

                                            -
                                            • Hadoop: MRS Hive and MRS Hudi
                                            -

                                            -

                                            -

                                            NoSQL

                                            -

                                            Distributed Cache Service (DCS)

                                            -

                                            Hadoop: MRS HDFS, MRS HBase, and MRS Hive

                                            -

                                            NoSQL except CloudTable cannot serve as the destination.

                                            -

                                            Redis

                                            -

                                            Document Database Service (DDS)

                                            -

                                            MongoDB

                                            -

                                            CloudTable HBase

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, RDS for SQL Server, MySQL, PostgreSQL, Microsoft SQL Server, and Oracle
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            Cassandra

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            Message system

                                            -

                                            -

                                            -

                                            Apache Kafka

                                            -

                                            Search: Cloud Search Service (CSS)

                                            -

                                            The message system cannot serve as the destination.

                                            -

                                            DMS Kafka

                                            -

                                            MRS Kafka

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -
                                            • MRS Kafka cannot serve as the destination.
                                            • Supported only by local storage and not in storage-compute decoupling scenarios.
                                            • Not supported by Ranger
                                            • Not supported if SSL is enabled for ZooKeeper.
                                            • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                              -
                                            -

                                            Search

                                            -

                                            -

                                            Elasticsearch

                                            -
                                            • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                            • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                            • Object storage: Object Storage Service (OBS)
                                            • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                            • NoSQL: CloudTable
                                            • Search: Elasticsearch and Cloud Search Service (CSS)
                                            -

                                            Only the non-security mode is supported.

                                            -

                                            Cloud Search Service (CSS)

                                            -

                                            -

                                            -
                                            -
                                            -

                                            In the preceding table, the non-cloud data sources, such as MySQL, include on-premises MySQL, MySQL built on ECSs, or MySQL on the third-party cloud.

                                            -
                                            - - -

                                            Supported Data Sources in Entire DB Migration

                                            Entire DB migration is used when an on-premises data center or a database created on an ECS needs to be synchronized to a database service or big data service on the cloud. It is suitable for offline database migration but not online real-time migration.

                                            -

                                            Table 2 lists the data sources supporting entire DB migration using CDM.

                                            - -
                                            - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                            Table 2 Supported data sources in entire DB migration

                                            Category

                                            -

                                            Data Source

                                            -

                                            Read

                                            -

                                            Write

                                            -

                                            Description

                                            -

                                            Data warehouse

                                            -

                                            GaussDB(DWS)

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            -

                                            -

                                            Hadoop

                                            -

                                            (available only for local storage, and not for storage-compute decoupling, Ranger, or ZooKeeper for which SSL is enabled)

                                            -

                                            MRS HBase

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            Entire DB migration only to MRS HBase

                                            -
                                            Recommended versions:
                                            • 2.1.X
                                            • 1.3.X
                                            -
                                            -

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            -

                                            MRS Hive

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            Entire DB migration only to a relational database

                                            -
                                            2.X versions are not supported. The following versions are recommended:
                                            • 1.2.X
                                            • 3.1.X
                                            -
                                            -

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            -

                                            FusionInsight HBase

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -
                                            Recommended versions:
                                            • 2.1.X
                                            • 1.3.X
                                            -
                                            -

                                            FusionInsight Hive

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Entire DB migration only to a relational database

                                            -
                                            2.X versions are not supported. The following versions are recommended:
                                            • 1.2.X
                                            • 3.1.X
                                            -
                                            -

                                            Apache HBase

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -
                                            Recommended versions:
                                            • 2.1.X
                                            • 1.3.X
                                            -
                                            -

                                            Apache Hive

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Entire DB migration only to a relational database

                                            -
                                            2.X versions are not supported. The following versions are recommended:
                                            • 1.2.X
                                            • 3.1.X
                                            -
                                            -

                                            MRS Hudi

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            Supported only by local storage and in storage-compute decoupling scenarios

                                            -

                                            2.X versions are not supported. The following versions are recommended:

                                            -
                                            • 1.2.X
                                            • 3.1.X
                                            -

                                            MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                            -

                                            Relational database

                                            -

                                            RDS for MySQL

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            Migration from OLTP to OLTP is not supported. In this scenario, you are advised to use the Data Replication Service (DRS).

                                            -

                                            RDS for PostgreSQL

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            RDS for SQL Server

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            MySQL

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            PostgreSQL

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Microsoft SQL Server

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Oracle

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            SAP HANA

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -
                                            • Only the 2.00.050.00.1592305219 version is supported.
                                            • Only the Generic Edition is supported.
                                            • BW/4 FOR HANA is not supported.
                                            • Only database names, table names, and column names consisting of English letters are supported. Special characters such as spaces and symbols are not allowed.
                                            • The following data types are supported: date, digit, Boolean, and character (except SHORTTEXT). Other data types such as binary are not supported.
                                            • During migration, tables cannot be automatically created at the destination.
                                            -

                                            Dameng database

                                            -

                                            Supported

                                            -

                                            Not supported

                                            -

                                            Only to DWS and Hive

                                            -

                                            NoSQL

                                            -

                                            Distributed Cache Service (DCS)

                                            -

                                            Not supported

                                            -

                                            Supported

                                            -

                                            Only migration from MRS to DCS is supported.

                                            -

                                            Document Database Service (DDS)

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            Only migration between DDS and MRS is supported.

                                            -

                                            CloudTable

                                            -

                                            Supported

                                            -

                                            Supported

                                            -

                                            -

                                            -
                                            -
                                            -
                                            - -
                                            - -
                                            - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0209.html b/docs/dataartsstudio/umn/dataartsstudio_01_0209.html index 6d7a7b9df..c0f15a7be 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0209.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0209.html @@ -2,13 +2,15 @@

                                            Converting Unsupported Data Types

                                            Scenario

                                            When field mapping is configured on CDM, a message is displayed indicating that the data type of the field is not supported and the field needs to be deleted. If you need to use this field, you can use SQL statements to convert the field type in the source job configuration to the type supported by CDM for data migration.

                                            -

                                            +

                                            -

                                            Procedure

                                            1. Modify the CDM migration job and enable Use SQL Statement.

                                              +

                                              Procedure

                                              1. Modify the CDM migration job and enable Use SQL Statement.

                                                +

                                                The SQL statement format is as follows: select id,cast(Original field name as INT) as New field name, which can be the same as the original field name from schemaName.tableName;

                                                -

                                                For example, select `id`, `name`, cast(`sex` AS char(255) ) AS `sex` from `test_1117869`.`test_no_support_type`;

                                                +

                                                Example: select `id`, `name`, cast(`gender` AS char(255) ) AS `gender` from `test_1117869`.`test_no_support_type`;

                                                -

                                              2. Wait for the fields to be converted to the data types supported by CDM.

                                                +

                                              3. Wait for the fields to be converted to the data types supported by CDM.

                                                +

                                            @@ -18,3 +20,10 @@
                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0215.html b/docs/dataartsstudio/umn/dataartsstudio_01_0215.html index b22a3e1a6..4f836359c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0215.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0215.html @@ -10,8 +10,6 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0224.html b/docs/dataartsstudio/umn/dataartsstudio_01_0224.html index 031646bca..bf66819ec 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0224.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0224.html @@ -82,7 +82,7 @@

                                            CHAR(M)

                                            A fixed-length string of 1 to 255 characters, for example, CHAR(5).

                                            +

                                            A fixed-length string of 1 to 255 characters, for example, CHAR(5). The string is padded to a specified length with spaces on the right.

                                            The length limit is not mandatory. It is set to 1 by default.

                                            'a' or 'aaaaa'

                                            @@ -94,7 +94,7 @@

                                            VARCHAR(M)

                                            A variable-length string consists of 1 to 255 characters (more than 255 characters for MySQL of a later version). Example: VARCHAR(25).

                                            +

                                            A variable-length string of 1 to 255 characters (more than 255 characters for MySQL of a later version), for example, VARCHAR(25).

                                            When creating a field of the VARCHAR type, you must define the length.

                                            'a' or 'aaaaa'

                                            @@ -202,7 +202,7 @@

                                            A medium-sized integer that can be signed. If the value is signed, it ranges from -8388608 to 8388607.

                                            If the value is unsigned, it ranges from 0 to 16777215, and you can specify a maximum of 9-bit width.

                                            -128, 127

                                            +

                                            -128 to 127

                                            INT

                                            BIT(M)

                                            Stored bit type value. BIT(M) can store up to M bits of values, and M ranges from 1 to 64.

                                            +

                                            Stored bit type value. BIT(M) can store up to M bits of values, and M ranges from 1 to 64.

                                            B'1111100' B'1100'

                                            TIMESTAMP

                                            Timestamp type. Timestamp between midnight on January 1, 1970 and a time point in 2037. Similar to the DATETIME format (YYYYMMDDHHMMSS), except that no hyphen is required. For example, 3:30 p.m. December 30, 1973 will be stored as 19731230153000.

                                            +

                                            Timestamp type. Timestamp between midnight on January 1, 1970 and a time point in 2037. Similar to the DATETIME format (YYYYMMDDHHMMSS), except that no hyphen is required. For example, 3:30 p.m. December 30, 1973 will be stored as 19731230153000.

                                            19731230153000

                                            BINARY(M)

                                            The number of bytes is M. The length of a variable-length binary string ranges from 0 to M. M is the value length plus 1.

                                            +

                                            The number of bytes is M. The length of a variable-length binary string ranges from 0 to M. M is the value length plus 1.

                                            0x2A3B4058 (binary data)

                                            VARBINARY(M)

                                            The number of bytes is M. A fixed binary string with a length of 0 to M.

                                            +

                                            The number of bytes is M. A fixed binary string with a length of 0 to M.

                                            0x2A3B4059 (binary data)

                                            int

                                            int is stored in four bytes, where one binary bit represents a sign bit, and the other 31 binary bits represent a length and a size, and may represent all integers ranging from –231 to 231 – 1.

                                            +

                                            int is stored in four bytes, where one binary bit represents a sign bit, and the other 31 binary bits represent a length and a size, and may represent all integers ranging from –231 to 231 – 1.

                                            INT

                                            smallmoney

                                            Similar to the money type, a currency symbol is prefixed to the input data. For example, the currency symbol of CNY is ¥.

                                            +

                                            Similar to the money type, a currency symbol is prefixed to the input data. For example, the currency symbol of USD is $.

                                            Not supported (string)

                                            bit

                                            Fixed-length string, for example, b'000101'

                                            +

                                            Fixed-length string, for example, b'000101'

                                            Not supported (string)

                                            varbit

                                            Variable-length string, for example, b'101'

                                            +

                                            Variable-length string, for example, b'101'

                                            Not supported (string)

                                            int

                                            int is stored in four bytes, where one binary bit represents a sign bit, and the other 31 binary bits represent a length and a size, and may represent all integers ranging from –231 to 231 – 1.

                                            +

                                            int is stored in four bytes, where one binary bit represents a sign bit, and the other 31 binary bits represent a length and a size, and may represent all integers ranging from –231 to 231 – 1.

                                            bigint

                                            @@ -1575,9 +1575,9 @@

                                            52.36

                                            DECIMAL(10,0)

                                            +

                                            DECIMAL(10, 0)

                                            DECIMAL(18,0)

                                            +

                                            DECIMAL(18, 0)

                                            INT

                                            @@ -1685,8 +1685,7 @@

                                            Stores information about the year, month, day, hour, minute, and second.

                                            2002-12-12 09:10:21','2002-12-12 9:10:21'

                                            -

                                            '2002/12/12 09:10:21' or '2002.12.12 09:10:21'

                                            +

                                            '2002-12-12 09:10:21', '2002-12-12 9:10:21', '2002/12/12 09:10:21', or '2002.12.12 09:10:21'

                                            TIMESTAMP

                                            TEXT

                                            It is used to store long character strings. The maximum length of a string is 2 GB minus 1 byte. Long text strings are stored.

                                            +

                                            Stores long character strings. The maximum length of a character string is 2 GB minus 1 byte. Long text strings are stored.

                                            Value

                                            @@ -1863,7 +1862,7 @@

                                            STRING

                                            It is used to store long character strings. The maximum length of a character string is 2 GB minus 1 byte. Long text strings are stored.

                                            +

                                            Stores long character strings. The maximum length of a character string is 2 GB minus 1 byte. Long text strings are stored.

                                            Value

                                            @@ -1930,9 +1929,9 @@
                                            - - @@ -1945,7 +1944,7 @@ - @@ -1983,7 +1982,7 @@ - @@ -1992,7 +1991,7 @@ - @@ -2038,7 +2037,7 @@ @@ -2158,567 +2157,687 @@
                                            Table 10 Data types supported for the Elasticsearch/CSS database

                                            Category

                                            Type

                                            +

                                            Type

                                            Description

                                            +

                                            Description

                                            Storage Format Example

                                            keyword

                                            Stores character strings.

                                            +

                                            Stores strings.

                                            "keyword"

                                            integer

                                            Stores 32-bit signed integers ranging from –231 to 231 – 1.

                                            +

                                            Stores 32-bit signed integers ranging from –231 to 231 – 1.

                                            3276566

                                            long

                                            Stores 64-bit signed integers ranging from –263 to 263 – 1.

                                            +

                                            Stores 64-bit signed integers ranging from –263 to 263 – 1.

                                            3276566666

                                            {"users.name":["John","Smith"],

                                            users.age":[26,28],

                                            -

                                            "users.sex":[1,2]}

                                            +

                                            "users.gender":[1, 2]}

                                            TEXT

                                            @@ -2052,10 +2051,10 @@

                                            {"users.name" : "John" ,

                                            "users.age" : 26,

                                            -

                                            "users.sex" : 1}

                                            +

                                            "users.gender" : 1}

                                            { "users.name" : "Smith",

                                            "users.age" : 28,

                                            -

                                            "users.sex" : 2}

                                            +

                                            "users.gender" : 2}

                                            TEXT

                                            -

                                            Data Types Supported in Dameng Database Migration

                                            When the source end is a Dameng database and the destination end is a Hive or DWS database, the following data types are supported.

                                            +

                                            Data Types Supported in Doris Database Migration

                                            If the migration source is a Doris database, the following data types are supported.

                                            -
                                            - - - @@ -100,7 +100,7 @@
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0252.html b/docs/dataartsstudio/umn/dataartsstudio_01_0252.html index 1bf046666..4d269ba87 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0252.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0252.html @@ -27,7 +27,7 @@ - @@ -80,7 +80,7 @@
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0286.html b/docs/dataartsstudio/umn/dataartsstudio_01_0286.html index 175e77f10..1d8d610c2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0286.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0286.html @@ -48,7 +48,7 @@ - - - @@ -107,7 +107,7 @@
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0291.html b/docs/dataartsstudio/umn/dataartsstudio_01_0291.html index a365cf860..c9a94c60d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0291.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0291.html @@ -25,8 +25,8 @@ - - @@ -51,22 +51,21 @@ - - - @@ -74,8 +73,8 @@ - @@ -83,10 +82,12 @@ - @@ -94,9 +95,13 @@ - @@ -104,30 +109,33 @@ - - - - @@ -135,8 +143,8 @@ - @@ -145,14 +153,14 @@ - - @@ -160,7 +168,7 @@ - @@ -168,16 +176,60 @@ - + + + + + + + + + + + + + + + + + + +
                                            Table 11 Data types supported for the Dameng database

                                            Category

                                            +
                                            - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +
                                            Table 11 Data types supported for the Doris database

                                            Category

                                            Type

                                            +

                                            Type

                                            Description

                                            -

                                            Storage Format Example

                                            -

                                            Hive

                                            -

                                            DWS

                                            +

                                            Description

                                            Character

                                            +

                                            String

                                            +

                                            CHAR

                                            +

                                            CHAR(M)

                                            Stores specified fixed-length character strings.

                                            -

                                            'a' or 'aaaaa'

                                            -

                                            CHAR

                                            -

                                            CHAR

                                            +

                                            Range: char[(length)]. A fixed-length string of 1 to 255 characters (1 by default).

                                            CHARACTER

                                            +

                                            VARCHAR(M)

                                            Same as CHAR

                                            -

                                            'a' or 'aaaaa'

                                            -

                                            CHAR

                                            -

                                            CHAR

                                            +

                                            Range: char(length). A variable-length string of 1 to 65,535 characters.

                                            VARCHAR

                                            +

                                            Value

                                            Stores specified variable-length character strings.

                                            +

                                            DECIMAL(M,D)

                                            'a' or 'aaaaa'

                                            -

                                            VARCHAR

                                            -

                                            VARCHAR

                                            +

                                            Uncompressed floating-point numbers cannot be unsigned. In unpacking decimals, each decimal corresponds to a byte.

                                            +

                                            Defining the number of display lengths (M) and decimals (D) is required. NUMERIC is the synonym of DECIMAL.

                                            VARCHAR2

                                            +

                                            Value type

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            Same as VARCHAR

                                            +

                                            TINYINT

                                            'a' or 'aaaaa'

                                            -

                                            VARCHAR

                                            -

                                            VARCHAR

                                            +

                                            Length: 1-byte signed integer

                                            +

                                            Range: [-128, 127]

                                            Value

                                            +

                                            SMALLINT

                                            NUMERIC

                                            -

                                            Stores zero, positive, and negative fixed point numbers.

                                            -

                                            52.36

                                            -

                                            DECIMAL

                                            -

                                            NUMERIC

                                            +

                                            Length: 2-byte signed integer

                                            +

                                            Range: [-32768, 32767]

                                            DECIMAL

                                            +

                                            INT

                                            Similar to NUMERIC

                                            -

                                            52.36

                                            -

                                            DECIMAL

                                            -

                                            NUMERIC

                                            +

                                            Length: 4-byte signed integer

                                            +

                                            Range: [-2147483648, 2147483647]

                                            DEC

                                            +

                                            BIGINT

                                            Same as DECIMAL

                                            -

                                            52.36

                                            -

                                            DECIMAL

                                            -

                                            NUMERIC

                                            +

                                            Length: 8-byte signed integer

                                            +

                                            Range: [-9223372036854775808, 9223372036854775807]

                                            NUMBER

                                            +

                                            LARGEINT

                                            Same as NUMERIC

                                            -

                                            52.36

                                            -

                                            DECIMAL

                                            -

                                            NUMERIC

                                            +

                                            Length: 16-byte signed integer

                                            +

                                            Range: [-2^127, 2^127-1]

                                            INTEGER

                                            +

                                            FLOAT

                                            Stores signed integers. Integer part: 10 digits; decimal part: 0 digits

                                            -

                                            5236

                                            -

                                            INT

                                            -

                                            INTEGER

                                            +

                                            Length: 4-byte floating point number

                                            +

                                            Range: -3.40E+38 to +3.40E+38

                                            INT

                                            +

                                            DOUBLE

                                            Same as INTEGER

                                            -

                                            5236

                                            -

                                            INT

                                            -

                                            INTEGER

                                            +

                                            Length: 8-byte floating point number

                                            +

                                            Range: -1.79E+308 to +1.79E+308

                                            BIGINT

                                            +

                                            DECIMAL[M,D]

                                            Stores signed integers. Integer part: 19 digits; decimal part: 0 digits

                                            -

                                            5236

                                            -

                                            BIGINT

                                            -

                                            BIGINT

                                            +

                                            Decimal type that ensures precision. M indicates the total number of valid digits, and D indicates the maximum number of digits after the decimal point. The range of M is [1,27], and that of D is [1,9]. In addition, M must be greater than or equal to D. The default value is decimal[10,0].

                                            +

                                            Precision: 1–27

                                            +

                                            Scale: 0–9

                                            TINYINT

                                            +

                                            Date

                                            +

                                            Stores signed integers. Integer part: 3 digits; decimal part: 0 digits

                                            +

                                            DATE

                                            100

                                            -

                                            TINYINT

                                            -

                                            SMALLINT

                                            +

                                            Range: ['1000-01-01', '9999-12-31']. The default printing format is 'YYYY-MM-DD'.

                                            SMALLINT

                                            +

                                            DATETIME

                                            Stores signed integers. Integer part: 5 digits; decimal part: 0 digits

                                            -

                                            9999

                                            -

                                            SMALLINT

                                            -

                                            SMALLINT

                                            +

                                            Range: ['1000-01-01 00:00:00', '9999-12-31 00:00:00']. The default printing format is 'YYYY-MM-DD HH:MM:SS'.

                                            BYTE

                                            +

                                            Special type

                                            +

                                            Similar to TINYINT. Integer part: 3 digits; decimal part: 0 digits

                                            +

                                            HLL

                                            100

                                            -

                                            TINYINT

                                            -

                                            SMALLINT

                                            +

                                            HyperLogLog (HLL) is a binary type. It can be used only for aggregation tables, and the aggregation type must be HLL_UNION.

                                            +

                                            This type is mainly used to pre-aggregate data in non-accurate and fast deduplication scenarios.

                                            +

                                            HLL columns can be queried or used only using hll_union_agg, hll_cardinality, or hll_hash.

                                            BINARY

                                            +

                                            BITMAP

                                            Stores fixed-length binary data.

                                            -

                                            0x2A3B4058

                                            -

                                            BINARY (NULL)

                                            -

                                            BYTEA (NULL)

                                            +

                                            BITMAP is a binary type. It can be used only for aggregation tables, and the aggregation type must be BITMAP_UNION.

                                            +

                                            This type is mainly used to pre-aggregate data in accurate deduplication scenarios. It can also be used to store user IDs in user profile scenarios.

                                            +

                                            BITMAP columns can be queried or used only using BITMAP functions.

                                            VARBINARY

                                            +
                                            +
                                            + +

                                            Data Types Supported in Dameng Database Migration

                                            When the source end is a Dameng database and the destination end is a Hive or DWS database, the following data types are supported.

                                            + +
                                            + + + + + + + + - - - - + - - - - - - - - - - - - - - - - - - - - + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + - - - - - + - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0226.html b/docs/dataartsstudio/umn/dataartsstudio_01_0226.html index a5c69d957..11fd58fef 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0226.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0226.html @@ -1,6 +1,6 @@ -

                                            Link to DWS

                                            +

                                            GaussDB(DWS) Link Parameters

                                            Table 1 describes the DWS link parameters.

                                            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                            @@ -58,16 +58,16 @@
                                            - - - - + + + + - + + + +
                                            Table 12 Data types supported for the Dameng database

                                            Category

                                            +

                                            Type

                                            +

                                            Description

                                            +

                                            Storage Format Example

                                            +

                                            Hive

                                            +

                                            DWS

                                            +

                                            Character

                                            Stores variable-length binary data.

                                            +

                                            CHAR

                                            0x2A3B4058

                                            +

                                            Stores specified fixed-length character strings.

                                            BINARY (NULL)

                                            +

                                            'a' or 'aaaaa'

                                            BYTEA (NULL)

                                            +

                                            CHAR

                                            +

                                            CHAR

                                            FLOAT

                                            +

                                            CHARACTER

                                            Stores floating-point numbers with binary precision.

                                            +

                                            Same as CHAR

                                            52.36

                                            +

                                            'a' or 'aaaaa'

                                            FLOAT

                                            +

                                            CHAR

                                            FLOAT8

                                            +

                                            CHAR

                                            DOUBLE

                                            +

                                            VARCHAR

                                            Similar to FLOAT

                                            +

                                            Stores specified variable-length character strings.

                                            52.36

                                            +

                                            'a' or 'aaaaa'

                                            DOUBLE

                                            +

                                            VARCHAR

                                            FLOAT8

                                            +

                                            VARCHAR

                                            REAL

                                            +

                                            VARCHAR2

                                            Stores binary floating-point numbers.

                                            +

                                            Same as VARCHAR

                                            52.3

                                            +

                                            'a' or 'aaaaa'

                                            FLOAT

                                            +

                                            VARCHAR

                                            FLOAT4

                                            +

                                            VARCHAR

                                            DOUBLE PRECISION

                                            +

                                            Value

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            +

                                            Stores double-precision floating-point numbers.

                                            +

                                            NUMERIC

                                            52.3

                                            +

                                            Stores zero, positive, and negative fixed point numbers.

                                            DOUBLE

                                            +

                                            52.36

                                            FLOAT8

                                            +

                                            DECIMAL

                                            +

                                            NUMERIC

                                            Bit string

                                            +

                                            DECIMAL

                                            BIT

                                            +

                                            Similar to NUMERIC

                                            Stores 1, 0, or NULL.

                                            +

                                            52.36

                                            1, 0, or NULL

                                            +

                                            DECIMAL

                                            TINYINT(1 0 NULL)

                                            -

                                            BOOLEAN(true false NULL)

                                            +

                                            NUMERIC

                                            Time and date

                                            +

                                            DEC

                                            DATE

                                            +

                                            Same as DECIMAL

                                            Stores information about the year, month, and day.

                                            +

                                            52.36

                                            '1999-10-01', '1999/10/01', or '1999.10.01'

                                            +

                                            DECIMAL

                                            DATE

                                            -

                                            TIMESTAMP

                                            +

                                            NUMERIC

                                            TIME

                                            +

                                            INTEGER

                                            Stores information about the hour, minute, and second.

                                            +

                                            Stores signed integers. Integer part: 10 digits; decimal part: 0 digits

                                            '09:10:21' or '9:10:21'

                                            +

                                            5236

                                            Not supported (string)

                                            +

                                            INT

                                            TIME

                                            +

                                            INTEGER

                                            TIMESTAMP

                                            +

                                            INT

                                            Stores information about the year, month, day, hour, minute, and second.

                                            +

                                            Same as INTEGER

                                            2002-12-12 09:10:21','2002-12-12 9:10:21'

                                            -

                                            '2002/12/12 09:10:21' or '2002.12.12 09:10:21'

                                            +

                                            5236

                                            TIMESTAMP

                                            +

                                            INT

                                            TIMESTAMP

                                            +

                                            INTEGER

                                            TIME WITH TIME ZONE

                                            +

                                            BIGINT

                                            Stores a TIME value with a time zone. Add the time zone information to the end of the TIME type.

                                            +

                                            Stores signed integers. Integer part: 19 digits; decimal part: 0 digits

                                            '09:10:21 +8:00', '09:10:21+8:00' or '9:10:21+8:00'

                                            +

                                            5236

                                            Not supported (string)

                                            +

                                            BIGINT

                                            TIME WITH TIME ZONE

                                            +

                                            BIGINT

                                            TIMESTAMP WITH TIME ZONE

                                            +

                                            TINYINT

                                            Stores a TIMESTAMP value with a time zone. Add the time zone information to the end of the TIMESTAMP type.

                                            +

                                            Stores signed integers. Integer part: 3 digits; decimal part: 0 digits

                                            2002-12-12 09:10:21 +8:00','2002-12-12 9:10:21 +8:00'

                                            -

                                            '2002/12/12 09:10:21 +8:00' or '2002.12.12 09:10:21 +8:00'

                                            +

                                            100

                                            TIMESTAMP

                                            +

                                            TINYINT

                                            TIMESTAMP WITH TIME ZONE

                                            +

                                            SMALLINT

                                            TIMESTAMP WITH LOCAL TIME ZONE

                                            +

                                            SMALLINT

                                            Stores the TIMESTAMP value of a local time zone. The standard time zone type (TIMESTAMP WITH TIME ZONE) can be converted to the local time zone type.

                                            +

                                            Stores signed integers. Integer part: 5 digits; decimal part: 0 digits

                                            2002-12-12 09:10:21 +8:00','2002-12-12 9:10:21 +8:00'

                                            -

                                            '2002/12/12 09:10:21 +8:00' or '2002.12.12 09:10:21 +8:00'

                                            +

                                            9999

                                            Not supported (string)

                                            +

                                            SMALLINT

                                            Not supported (TEXT)

                                            +

                                            SMALLINT

                                            DATETIME WITH TIME ZONE

                                            +

                                            BYTE

                                            Same as TIMESTAMP WITH TIME ZONE

                                            +

                                            Similar to TINYINT. Integer part: 3 digits; decimal part: 0 digits

                                            2002-12-12 09:10:21 +8:00','2002-12-12 9:10:21 +8:00'

                                            -

                                            '2002/12/12 09:10:21 +8:00' or '2002.12.12 09:10:21 +8:00'

                                            +

                                            100

                                            TIMESTAMP

                                            +

                                            TINYINT

                                            TIMESTAMP WITH TIME ZONE

                                            +

                                            SMALLINT

                                            INTERVAL YEAR

                                            +

                                            BINARY

                                            Interval of years. The leading precision specifies the range of years.

                                            +

                                            Stores fixed-length binary data.

                                            INTERVAL '0015' YEAR

                                            +

                                            0x2A3B4058

                                            Not supported (string)

                                            +

                                            BINARY (NULL)

                                            Not supported (VARCHAR)

                                            +

                                            BYTEA (NULL)

                                            INTERVAL YEAR TO MONTH

                                            +

                                            VARBINARY

                                            Interval of months and years. The leading precision specifies the range of years.

                                            +

                                            Stores variable-length binary data.

                                            INTERVAL '0015-08' YEAR TO MONTH

                                            +

                                            0x2A3B4058

                                            Not supported (string)

                                            +

                                            BINARY (NULL)

                                            Not supported (VARCHAR)

                                            +

                                            BYTEA (NULL)

                                            INTERVAL MONTH

                                            +

                                            FLOAT

                                            Interval of months. The leading precision specifies the range of months.

                                            +

                                            Stores floating-point numbers with binary precision.

                                            INTERVAL '0015' MONTH

                                            +

                                            52.36

                                            Not supported (string)

                                            +

                                            FLOAT

                                            Not supported (VARCHAR)

                                            +

                                            FLOAT8

                                            INTERVAL DAY

                                            +

                                            DOUBLE

                                            Interval of days. The leading precision specifies the range of days.

                                            +

                                            Similar to FLOAT

                                            INTERVAL '150' DAY

                                            +

                                            52.36

                                            Not supported (string)

                                            +

                                            DOUBLE

                                            Not supported (VARCHAR)

                                            +

                                            FLOAT8

                                            INTERVAL DAY TO HOUR

                                            +

                                            REAL

                                            Interval of hours and days. The leading precision specifies the range of days.

                                            +

                                            Stores binary floating-point numbers.

                                            INTERVAL '9 23' DAY TO HOUR

                                            +

                                            52.3

                                            Not supported (string)

                                            +

                                            FLOAT

                                            Not supported (VARCHAR)

                                            +

                                            FLOAT4

                                            INTERVAL DAY TO MINUTE

                                            +

                                            DOUBLE PRECISION

                                            Interval of minutes, hours, and days. The leading precision specifies the range of days.

                                            +

                                            Stores double-precision floating-point numbers.

                                            INTERVAL '09 23:12' DAY TO MINUTE

                                            +

                                            52.3

                                            Not supported (string)

                                            +

                                            DOUBLE

                                            Not supported (VARCHAR)

                                            +

                                            FLOAT8

                                            INTERVAL DAY TO SECOND

                                            +

                                            Bit string

                                            Interval of seconds, minutes, hours, and days. The leading precision specifies the range of days.

                                            +

                                            BIT

                                            INTERVAL '09 23:12:01.1' DAY TO SECOND

                                            +

                                            Stores 1, 0, or NULL.

                                            Not supported (string)

                                            +

                                            1, 0, or NULL

                                            Not supported (VARCHAR)

                                            +

                                            TINYINT(1 0 NULL)

                                            +

                                            BOOLEAN (true false NULL)

                                            INTERVAL HOUR

                                            +

                                            Time and date

                                            Interval of hours. The leading precision specifies the range of hours.

                                            +

                                            DATE

                                            INTERVAL '150' HOUR

                                            +

                                            Stores information about the year, month, and day.

                                            Not supported (string)

                                            +

                                            '1999-10-01', '1999/10/01', or '1999.10.01'

                                            Not supported (VARCHAR)

                                            +

                                            DATE

                                            +

                                            TIMESTAMP

                                            INTERVAL HOUR TO MINUTE

                                            +

                                            TIME

                                            Interval of minutes and hours. The leading precision specifies the range of hours.

                                            +

                                            Stores information about the hour, minute, and second.

                                            INTERVAL '23:12' HOUR TO MINUTE

                                            +

                                            '09:10:21' or '9:10:21'

                                            Not supported (string)

                                            +

                                            Not supported (string)

                                            Not supported (VARCHAR)

                                            +

                                            TIME

                                            INTERVAL HOUR TO SECOND

                                            +

                                            TIMESTAMP

                                            Interval of seconds, minutes, and hours. The leading precision specifies the range of hours.

                                            +

                                            Stores information about the year, month, day, hour, minute, and second.

                                            INTERVAL '23:12:01.1' HOUR TO SECOND

                                            +

                                            '2002-12-12 09:10:21', '2002-12-12 9:10:21', '2002/12/12 09:10:21', or '2002.12.12 09:10:21'

                                            Not supported (string)

                                            +

                                            TIMESTAMP

                                            Not supported (VARCHAR)

                                            +

                                            TIMESTAMP

                                            INTERVAL MINUTE

                                            +

                                            TIME WITH TIME ZONE

                                            Interval of minutes. The leading precision specifies the range of minutes.

                                            +

                                            Stores a TIME value with a time zone. Add the time zone information to the end of the TIME type.

                                            INTERVAL '150' MINUTE

                                            +

                                            '09:10:21 +8:00', '09:10:21+8:00', or '9:10:21+8:00'

                                            Not supported (string)

                                            +

                                            Not supported (string)

                                            Not supported (VARCHAR)

                                            +

                                            TIME WITH TIME ZONE

                                            INTERVAL MINUTE TO SECOND

                                            +

                                            TIMESTAMP WITH TIME ZONE

                                            Interval of seconds and minutes. The leading precision specifies the range of minutes

                                            -

                                            .

                                            +

                                            Stores a TIMESTAMP value with a time zone. Add the time zone information to the end of the TIMESTAMP type.

                                            INTERVAL '12:01.1' MINUTE TO SECOND

                                            +

                                            '2002-12-12 09:10:21 +8:00', '2002-12-12 9:10:21 +8:00', '2002/12/12 09:10:21 +8:00', or '2002.12.12 09:10:21 +8:00'

                                            Not supported (string)

                                            +

                                            TIMESTAMP

                                            Not supported (VARCHAR)

                                            +

                                            TIMESTAMP WITH TIME ZONE

                                            INTERVAL SECOND

                                            +

                                            TIMESTAMP WITH LOCAL TIME ZONE

                                            Interval of seconds. The leading precision specifies the range of the integer part of the second

                                            -

                                            .

                                            +

                                            Stores the TIMESTAMP value of a local time zone. The standard time zone type (TIMESTAMP WITH TIME ZONE) can be converted to the local time zone type.

                                            INTERVAL '51.1' SECOND

                                            +

                                            '2002-12-12 09:10:21 +8:00', '2002-12-12 9:10:21 +8:00', '2002/12/12 09:10:21 +8:00', or '2002.12.12 09:10:21 +8:00'

                                            Not supported (string)

                                            +

                                            Not supported (string)

                                            Not supported (VARCHAR)

                                            +

                                            Not supported (TEXT)

                                            Multimedia

                                            +

                                            DATETIME WITH TIME ZONE

                                            IMAGE

                                            +

                                            Same as TIMESTAMP WITH TIME ZONE

                                            IMAGE specifies the image type in the multimedia information.

                                            +

                                            '2002-12-12 09:10:21 +8:00', '2002-12-12 9:10:21 +8:00', '2002/12/12 09:10:21 +8:00', or '2002.12.12 09:10:21 +8:00'

                                            +

                                            TIMESTAMP

                                            +

                                            TIMESTAMP WITH TIME ZONE

                                            +

                                            INTERVAL YEAR

                                            +

                                            Interval of years. The leading precision specifies the range of years.

                                            +

                                            INTERVAL '0015' YEAR

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL YEAR TO MONTH

                                            +

                                            Interval of months and years. The leading precision specifies the range of years.

                                            +

                                            INTERVAL '0015-08' YEAR TO MONTH

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL MONTH

                                            +

                                            Interval of months. The leading precision specifies the range of months.

                                            +

                                            INTERVAL '0015' MONTH

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL DAY

                                            +

                                            Interval of days. The leading precision specifies the range of days.

                                            +

                                            INTERVAL '150' DAY

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL DAY TO HOUR

                                            +

                                            Interval of hours and days. The leading precision specifies the range of days.

                                            +

                                            INTERVAL '9 23' DAY TO HOUR

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL DAY TO MINUTE

                                            +

                                            Interval of minutes, hours, and days. The leading precision specifies the range of days.

                                            +

                                            INTERVAL '09 23:12' DAY TO MINUTE

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL DAY TO SECOND

                                            +

                                            Interval of seconds, minutes, hours, and days. The leading precision specifies the range of days.

                                            +

                                            INTERVAL '09 23:12:01.1' DAY TO SECOND

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL HOUR

                                            +

                                            Interval of hours. The leading precision specifies the range of hours.

                                            +

                                            INTERVAL '150' HOUR

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL HOUR TO MINUTE

                                            +

                                            Interval of minutes and hours. The leading precision specifies the range of hours.

                                            +

                                            INTERVAL '23:12' HOUR TO MINUTE

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL HOUR TO SECOND

                                            +

                                            Interval of seconds, minutes, and hours. The leading precision specifies the range of hours.

                                            +

                                            INTERVAL '23:12:01.1' HOUR TO SECOND

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL MINUTE

                                            +

                                            Interval of minutes. The leading precision specifies the range of minutes.

                                            +

                                            INTERVAL '150' MINUTE

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL MINUTE TO SECOND

                                            +

                                            Interval of minutes and seconds. The leading precision specifies the range of minutes.

                                            +

                                            INTERVAL '12:01.1' MINUTE TO SECOND

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            INTERVAL SECOND

                                            +

                                            Interval of seconds. The leading precision specifies the value range of the integer part of the second

                                            +

                                            INTERVAL '51.1' SECOND

                                            +

                                            Not supported (string)

                                            +

                                            Not supported (VARCHAR)

                                            +

                                            Multimedia

                                            +

                                            IMAGE

                                            +

                                            IMAGE specifies the image type in the multimedia information.

                                            An image consists of a pixel lattice with a maximum length of 2 GB minus 1 byte. In addition to storing image data, other binary data can also be stored.

                                            0x2A3B4058 (binary data)

                                            +

                                            0x2A3B4058 (binary data)

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            LONGVARBINARY

                                            +

                                            LONGVARBINARY

                                            Same as IMAGE

                                            +

                                            Same as IMAGE

                                            0x2A3B4059 (binary data)

                                            +

                                            0x2A3B4059 (binary data)

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            TEXT

                                            +

                                            TEXT

                                            Stores the long string type.

                                            +

                                            Stores the long string type.

                                            The maximum length of a string is 2 GB minus 1 byte.

                                            0x5236 (binary data)

                                            +

                                            0x5236 (binary data)

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            LONGVARCHAR

                                            +

                                            LONGVARCHAR

                                            Similar to TEXT

                                            +

                                            Similar to TEXT

                                            0x5236 (binary data)

                                            +

                                            0x5236 (binary data)

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            BLOB

                                            +

                                            BLOB

                                            Stores variable-length binary large objects with a maximum length of 2 GB minus 1 byte.

                                            +

                                            Stores variable-length binary large objects with a maximum length of 2 GB minus 1 byte.

                                            0x5236 (binary data)

                                            +

                                            0x5236 (binary data)

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            CLOB

                                            +

                                            CLOB

                                            Stores variable-length binary large objects with a maximum length of 2 GB minus 1 byte.

                                            +

                                            Stores variable-length binary large objects with a maximum length of 2 GB minus 1 byte.

                                            0x5236 (binary data)

                                            +

                                            0x5236 (binary data)

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            BFILE

                                            +

                                            BFILE

                                            Specified the binary files stored in the operating systems.

                                            +

                                            Specified the binary files stored in the operating systems.

                                            Files are stored in the operating systems instead of the databases. They can be read only.

                                            -

                                            +

                                            -

                                            Not supported

                                            +

                                            Not supported

                                            Not supported

                                            +

                                            Not supported

                                            Use Agent

                                            Whether to extract data from the data source through an agent

                                            +

                                            The agent function will be unavailable soon and does not need to be configured.

                                            Yes

                                            +

                                            -

                                            Agent

                                            Click Select and select the agent created in Managing Agents.

                                            +

                                            The agent function will be unavailable soon and does not need to be configured.

                                            -

                                            +

                                            -

                                            Reference Sign

                                            @@ -85,9 +85,17 @@

                                            1000

                                            Commit Size

                                            +

                                            (Optional) Displayed when you click Show Advanced Attributes.

                                            +

                                            Number of records submitted each time. Set this parameter based on the destination and data size of the job. If the value is too large or too small, the job execution time may be affected.

                                            +

                                            10000

                                            +

                                            SSL Encryption

                                            (Optional) If you set this parameter to Yes, CDM can connect to the database (on-premises databases excluded) in SSL encryption mode.

                                            +

                                            Whether to connect to the data warehouse in SSL mode

                                            Yes

                                            NOTE:

                                            To enable SSL encryption, you must ensure that it is enabled for GaussDB(DWS).

                                            @@ -105,13 +113,21 @@

                                            Link Secret Attributes

                                            +

                                            (Optional) Displayed when you click Show Advanced Attributes.

                                            +

                                            Custom secret attributes of the link

                                            +

                                            sk=09fUgD5WOF1L6f

                                            +
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0227.html b/docs/dataartsstudio/umn/dataartsstudio_01_0227.html index f6bd0ed32..a1e6062e9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0227.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0227.html @@ -1,6 +1,6 @@ -

                                            Link to SAP HANA

                                            +

                                            SAP HANA Link Parameters

                                            Table 1 describes the SAP HANA link parameters.

                                            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                            @@ -58,14 +58,14 @@

                                            Use Agent

                                            Whether to extract data from the data source through an agent

                                            +

                                            The agent function will be unavailable soon and does not need to be configured.

                                            Yes

                                            +

                                            -

                                            Agent

                                            Click Select and select the agent created in Managing Agents.

                                            +

                                            The agent function will be unavailable soon and does not need to be configured.

                                            -

                                            Name of the table to which data will be written. Click the icon next to the text box. The dialog box for selecting the table is displayed.

                                            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            table

                                            @@ -89,7 +89,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0261.html b/docs/dataartsstudio/umn/dataartsstudio_01_0261.html index 2baae0851..8cfb6a018 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0261.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0261.html @@ -1,13 +1,13 @@ -

                                            Configuring Field Mapping

                                            -

                                            Scenario

                                            • After the job parameters are configured, you can configure field mapping. You can click on the Map Field page to customize new fields or click in the Operation column to create a field converter.
                                            • If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.
                                            • In other scenarios, CDM automatically maps fields of the source table and the destination table. You need to check whether the mapping and time format are correct. For example, check whether the source field type can be converted into the destination field type.
                                            • In the auto table creation scenario, you need to add fields to the destination table in advance, and add the fields to the field mapping.
                                            +

                                            Configuring CDM Job Field Mapping

                                            +

                                            Scenario

                                            • After the job parameters are configured, you can configure field mapping. You can click on the Map Field page to customize new fields or click in the Operation column to create a field converter.
                                            • If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.
                                            • In other scenarios, CDM automatically maps fields of the source table and the destination table. You need to check whether the mapping and time format are correct. For example, check whether the source field type can be converted into the destination field type.
                                            • In the auto table creation scenario, you need to add fields to the destination table in advance, and add the fields to the field mapping.

                                            Constraints

                                            • If Use SQL Statement is set to Yes in the source job configuration, converters cannot be created.
                                            -
                                            • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
                                            • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
                                            • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datetime) so that they can be written.
                                            • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
                                            • Field mapping is not involved when the binary format is used to migrate files to files.
                                            • In the automatic table creation scenario, you need to manually add fields to the destination table in advance and then add fields to the field mapping.
                                            • After a field is added, its sample value is not displayed on the console. This does not affect the field value transmission. CDM directly writes the field value to the destination end.
                                            • If the field mapping is incorrect, you can adjust the field mapping by dragging fields or clicking to map fields in batches.
                                            • If the data is imported to DWS, you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following principles:
                                              1. Use the primary key as the distribution column.
                                              2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
                                              3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
                                              +
                                              • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
                                              • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
                                              • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datetime) so that they can be written.
                                              • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
                                              • Field mapping is not involved when the binary format is used to migrate files to files.
                                              • In the automatic table creation scenario, you need to manually add fields to the destination table in advance and then add fields to the field mapping.
                                              • After a field is added, its sample value is not displayed on the console. This does not affect the field value transmission. CDM directly writes the field value to the destination end.
                                              • If the field mapping is incorrect, you can adjust the field mapping by dragging fields or clicking to map fields in batches.
                                              • If the data is imported to DWS, you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following principles:
                                                1. Use the primary key as the distribution column.
                                                2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
                                                3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
                                              • If a source field type is not supported, convert the field type to a type supported by CDM by referring to Converting Unsupported Data Types.
                                            -

                                            Adding a Field

                                            You can click on the Map Field page and select Add to customize a new field. This field is usually used to mark the database source to ensure the integrity of the data imported to the migration destination.
                                            Figure 1 Field mapping
                                            +

                                            Adding a Field

                                            You can click on the Map Field page and select Add to customize a new field. This field is usually used to mark the database source to ensure the integrity of the data imported to the migration destination.
                                            Figure 1 Field mapping
                                            Currently, the following field types are supported:
                                            • Constant Parameter

                                              Constant parameters are fixed parameters and do not need to be reconfigured. For example, lable = friends is used to identify a constant value.

                                            • Variables

                                              You can use variables such as time macros, table name macros, and version macros to mark database source information. The variable syntax is ${variable}, where variable indicates a variable. For example, input_time = ${timestamp()} indicates the timestamp of the current time.

                                              @@ -15,7 +15,7 @@
                                            -

                                            Creating a Converter

                                            CDM supports field conversion. Click and then click Create Converter.
                                            Figure 2 Creating a converter
                                            +

                                            Creating a Converter

                                            CDM supports field conversion. Click and then click Create Converter.
                                            Figure 2 Creating a converter

                                            CDM can convert fields during migration. Currently, the following field converters are supported:

                                            • Anonymization
                                              This converter is used to hide key information about the character string. For example, if you want to convert 12345678910 to 123****8910, configure the parameters as follows:
                                              • Set Reserve Start Length to 3.
                                              • Set Reserve End Length to 4.
                                              • Set Replace Character to *.
                                              @@ -24,12 +24,12 @@
                                            • Reverse string

                                              This converter is used to automatically reverse a string. For example, reverse ABC into CBA. No parameters need to be configured.

                                            • Replace string

                                              This converter is used to replace a character string. You need to configure the object to be replaced and the new value.

                                            • Remove line break

                                              This converter is used to delete the newline characters, such as \n, \r, and \r\n from the field.

                                              -
                                            • Expression conversion

                                              This converter uses the JSP expression language (EL) to convert the current field or a row of data. The JSP EL is used to create arithmetic and logical expressions. Within a JSP EL expression, you can use integers, floating point numbers, strings, the built-in constants true and false for boolean values, and null.

                                              +
                                            • Expression conversion

                                              During data conversion, if the content to be replaced contains a special character, use a backslash (\) to escape the special character to a common one.

                                              • The expression supports the following environment variables:
                                                • value: indicates the current field value.
                                                • row: indicates the current row, which is an array type.
                                              • The expression supports the following Utils:
                                                1. If the field is of the string type, convert all character strings into lowercase letters, for example, convert aBC to abc.

                                                  Expression: StringUtils.lowerCase(value)

                                                2. Convert all character strings of the current field to uppercase letters.

                                                  Expression: StringUtils.upperCase(value)

                                                3. Convert the format of the first date field from 2018-01-05 15:15:05 to 20180105.

                                                  Expression: DateUtils.format(DateUtils.parseDate(row[0],"yyyy-MM-dd HH:mm:ss"),"yyyyMMdd")

                                                  -
                                                4. Convert a timestamp to a date string in yyyy-MM-dd hh:mm:ss format, for example, convert 1701312046588 to 2023-11-30 10:40:46.

                                                  Expression: DateUtils.format(NumberUtils.toLong(value),"yyyy-MM-dd HH:mm:ss")

                                                  +
                                                5. Convert a timestamp to a date string in yyyy-MM-dd hh:mm:ss format, for example, convert 1701312046588 to 2023-11-30 10:40:46.

                                                  Expression: DateUtils.format(NumberUtils.toLong(value),"yyyy-MM-dd HH:mm:ss")

                                                6. Convert a date string in the yyyy-MM-dd hh:mm:ss format to a timestamp.

                                                  Expression: DateUtils.getTime(DateUtils.parseDate(value,"yyyy-MM-dd hh:mm:ss"))

                                                7. If the field value is a date string in yyyy-MM-dd format, extract the year from the field value, for example, extract 2017 from 2017-12-01.

                                                  Expression: StringUtils.substringBefore(value,"-")

                                                8. If the field value is of the numeric type, convert the value to a new value which is two times greater than the original value:

                                                  Expression: value*2

                                                  @@ -68,12 +68,13 @@
                                                9. If the field is of the string type, remove the substring at the end of the field. If the specified substring is not at the end of the field, no conversion is performed. For example, remove .com at the end of www.domain.com.

                                                  Expression: StringUtils.removeEnd(value,".com")

                                                10. If the field is of the string type, delete the substring at the beginning of the field. If the specified substring is not at the beginning of the field, no conversion is performed. For example, delete www. at the beginning of www.domain.com.

                                                  Expression: StringUtils.removeStart(value,"www.")

                                                11. If the field is of the string type, replace all the specified character strings in the field. For example, replace a in aba with z to obtain zbz.

                                                  Expression: StringUtils.replace(value,"a","z")

                                                  +

                                                  If the content to be replaced contains a special character, the special character must be escaped to a common character. For example, if you want to delete \t from a string, use the following expression: StringUtils.replace(value,"\\t",""), which means escaping the backslash (\) again.

                                                12. If the field is of the string type, replace multiple characters in the character string at a time. For example, replace h in hello with j and o with y to obtain jelly.

                                                  Expression: StringUtils.replaceChars(value,"ho","jy")

                                                13. If the string starts with the specified prefix (case sensitive), true is returned; otherwise, false is returned. For example, abcdef starts with abc, so that true is returned.

                                                  Expression: StringUtils.startsWith(value,"abc")

                                                14. If the field is of the string type, delete all the specified characters at the beginning and end of the field. the field. For example, delete all x, y, z, and b from abcyx to obtain abc.

                                                  Expression: StringUtils.strip(value,"xyzb")

                                                  -
                                                15. If the field is of the string type, delete all the specified characters at the end of the field, for example, delete the abc string at the end of the field.

                                                  Expression: StringUtils.stripEnd(value,"abc")

                                                  +
                                                16. If the field is of the string type, delete all the specified characters at the end of the field, for example, delete the "abc" string at the end of the field.

                                                  Expression: StringUtils.stripEnd(value,"abc")

                                                17. If the field is of the string type, delete all the specified characters at the beginning of the field, for example, delete all spaces at the beginning of the field.

                                                  Expression: StringUtils.stripStart(value,null)

                                                  -
                                                18. If the field is of the string type, obtain the substring after the specified position (the index starts from 0, including the character at the specified position) of the character string. If the specified position is a negative number, calculate the position in the descending order. The first digit at the end is -1. For example, obtain the second character (c) of abcde and the string after it, that is, cde.

                                                  Expression: StringUtils.substring(value,2)

                                                  +
                                                19. If the field is of the string type, obtain the substring after the specified position (the index starts from 0, including the character at the specified position) of the character string. If the specified position is a negative number, calculate the position in the descending order. The first digit at the end is -1. For example, obtain the character whose index is 2 from abcde (that is, c) and the string after it, that is, cde.

                                                  Expression: StringUtils.substring(value,2)

                                                20. If the field is of the string type, obtain the substring in a specified range (the index starts from 0, including the character at the start and excluding the character at the end). If the range is a negative number, calculate the position in the descending order. The first digit at the end is -1. For example, obtain the string between the second character (c) and fourth character (e) of abcde, that is, cd.

                                                  Expression: StringUtils.substring(value,2,4)

                                                21. If the field is of the string type, obtain the substring after the first specified character. For example, obtain the substring after the first b in abcba, that is, cba.

                                                  Expression: StringUtils.substringAfter(value,"b")

                                                22. If the field is of the string type, obtain the substring after the last specified character. For example, obtain the substring after the last b in abcba, that is, a.

                                                  Expression: StringUtils.substringAfterLast(value,"b")

                                                  @@ -93,13 +94,13 @@
                                                23. Convert the character string to a value of the long type. If the conversion fails, the specified value, for example, 1L, is returned.

                                                  Expression: NumberUtils.toLong(value,1L)

                                                24. Convert the character string to a value of the short type. If the conversion fails, 0 is returned.

                                                  Expression: NumberUtils.toShort(value)

                                                25. Convert the character string to a value of the short type. If the conversion fails, the specified value, for example, 1, is returned.

                                                  Expression: NumberUtils.toShort(value,1)

                                                  -
                                                26. Convert the IP string to a value of the long type, for example, convert 10.78.124.0 to 172915712.

                                                  Expression: CommonUtils.ipToLong(value)

                                                  +
                                                27. Convert the IP string to a value of the long type, for example, convert 10.78.124.0 to 172915712.

                                                  Expression: CommonUtils.ipToLong(value)

                                                28. Read an IP address and physical address mapping file from the network, and download the mapping file to the map collection. url indicates the address for storing the IP mapping file, for example, http://10.114.205.45:21203/sqoop/IpList.csv.

                                                  Expression: HttpsUtils.downloadMap("url")

                                                29. Cache the IP address and physical address mappings and specify a key for retrieval, for example, ipList.

                                                  Expression: CommonUtils.setCache("ipList",HttpsUtils.downloadMap("url"))

                                                30. Obtain the cached IP address and physical address mappings.

                                                  Expression: CommonUtils.getCache("ipList")

                                                31. Check whether the IP address and physical address mappings are cached.

                                                  Expression: CommonUtils.cacheExists("ipList")

                                                32. Based on the specified offset type (month/day/hour/minute/second) and offset (positive number indicates increase and negative number indicates decrease), convert the time in the specified format to a new time, for example, add 8 hours to 2019-05-21 12:00:00.

                                                  Expression: DateUtils.getCurrentTimeByZone("yyyy-MM-dd HH:mm:ss",value, "hour", 8)

                                                  -
                                                33. If the value is empty or null, "aaa" is returned. Otherwise, value is returned.

                                                  Expression: StringUtils.defaultIfEmpty(value,"aaa")

                                                  +
                                                34. If the value is empty or null, "aaa" is returned. Otherwise, value is returned.

                                                  Expression: StringUtils.defaultIfEmpty(value,"aaa")

                                            @@ -109,7 +110,14 @@
                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0285.html b/docs/dataartsstudio/umn/dataartsstudio_01_0285.html index 08eee79ba..58d6e784b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0285.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0285.html @@ -1,6 +1,6 @@ -

                                            Link to MRS ClickHouse

                                            +

                                            MRS ClickHouse Link Parameters

                                            Table 1 describes the MRS ClickHouse link parameters.

                                            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                            @@ -22,10 +22,10 @@

                                            Database Server

                                            IP address or domain name of the database to connect

                                            -

                                            Log in to Manager of the cluster where the MRS ClickHouse data source is located, choose Cluster > Services > ClickHouse > Instance, and view the ClickHouseServer service IP address.

                                            -
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            +
                                            IP address or domain name of the database to connect
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            +
                                            +

                                            Log in to Manager of the cluster where the MRS ClickHouse data source is located, choose Cluster > Services > ClickHouse > Instance, and view the ClickHouseServer service IP address.

                                            192.168.0.1

                                            This parameter indicates the WHERE clause to be extracted. If this parameter is not set, the entire table is extracted. If the table to be migrated does not contain the fields specified by the WHERE clause, the migration will fail.

                                            You can set a date macro variable to extract data generated on a specific date.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            age > 18 and age <= 60

                                            @@ -60,7 +60,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0287.html b/docs/dataartsstudio/umn/dataartsstudio_01_0287.html index ace7917cc..be11a6941 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0287.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0287.html @@ -26,7 +26,7 @@

                                            Destination table name.

                                            Click the icon next to the text box. The dialog box for selecting the table is displayed.

                                            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            table

                                            @@ -60,7 +60,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0288.html b/docs/dataartsstudio/umn/dataartsstudio_01_0288.html new file mode 100644 index 000000000..8e753c4ab --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0288.html @@ -0,0 +1,59 @@ + + +

                                            LogHub (SLS) Link Parameters

                                            +

                                            Table 1 describes the LogHub (SLS) link parameters.

                                            + +
                                            + + + + + + + + + + + + + + + + + + + + + + + + + +
                                            Table 1 LogHub (SLS) link parameters

                                            Parameter

                                            +

                                            Description

                                            +

                                            Example Value

                                            +

                                            Name

                                            +

                                            Link name

                                            +

                                            sls_link

                                            +

                                            EndPoint

                                            +

                                            URL for accessing a project and its logs

                                            +

                                            An endpoint is the request address for calling an API. Endpoints vary depending on services and regions. You can obtain the endpoints of the service from Regions and Endpoints.

                                            +

                                            -

                                            +

                                            Project

                                            +

                                            Project name of the target log service. It is a resource management unit in the log service and is used to isolate and control resources.

                                            +

                                            sls_project

                                            +

                                            AccessKeyID

                                            +

                                            Key for accessing the log service, which is used to identify a user

                                            +

                                            -

                                            +

                                            accessKeySecret

                                            +

                                            Key for accessing the log service, which is used to authenticate the user

                                            +

                                            -

                                            +
                                            +
                                            +
                                            +
                                            + +
                                            + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0289.html b/docs/dataartsstudio/umn/dataartsstudio_01_0289.html new file mode 100644 index 000000000..183e70085 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0289.html @@ -0,0 +1,60 @@ + + +

                                            From LogHub (SLS)

                                            +

                                            If the source link of a job is a LogHub (SLS) link, configure the source job parameters based on Table 1.

                                            + +
                                            + + + + + + + + + + + + + + + + + + + + + + + + + +
                                            Table 1 Parameter description

                                            Parameter

                                            +

                                            Description

                                            +

                                            Example Value

                                            +

                                            Source Link Name

                                            +

                                            LogHub (SLS) link

                                            +

                                            sls_link

                                            +

                                            LogStore

                                            +

                                            Name of the target logstore

                                            +

                                            -

                                            +

                                            BatchSize

                                            +

                                            Number of data records obtained from the log service at a time

                                            +

                                            128

                                            +

                                            BeginDateTime

                                            +

                                            Start time of data consumption, that is, the time when log data reaches LogHub (SLS). The value is a time string in yyyyMMddHHmmss format.

                                            +
                                            NOTE:

                                            This parameter must be used together with EndDateTime. The value range includes BeginDateTime and excludes EndDateTime.

                                            +
                                            +

                                            20220113013000

                                            +

                                            EndDateTime

                                            +

                                            End time of data consumption. The value is a string in yyyyMMddHHmmss format.

                                            +

                                            20220213013000

                                            +
                                            +
                                            +
                                            + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0290.html b/docs/dataartsstudio/umn/dataartsstudio_01_0290.html index 52bfb0aeb..bd058254c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0290.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0290.html @@ -1,6 +1,6 @@ -

                                            Link to a ShenTong Database

                                            +

                                            ShenTong Database Link Parameters

                                            Table 1 lists the parameters for a link to a ShenTong database.

                                            Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                            @@ -58,14 +58,14 @@

                                            Use Agent

                                            Whether to extract data from the data source through an agent

                                            +

                                            The agent function will be unavailable soon and does not need to be configured.

                                            Yes

                                            +

                                            -

                                            Agent

                                            Click Select and select the agent created in Managing Agents.

                                            +

                                            The agent function will be unavailable soon and does not need to be configured.

                                            -

                                            SQL Statement

                                            When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

                                            -
                                            NOTE:
                                            • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                            • With statements are not supported.
                                            • Comments, such as -- and /*, are not supported.
                                            • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                              • load data
                                              • delete from
                                              • alter table
                                              • create table
                                              • drop table
                                              • into outfile
                                              -
                                            • Quote characters take effect only for SQL statements generated in the database table configuration, and cannot be added to custom SQL statements.
                                            +
                                            NOTE:
                                            • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                            • With statements are not supported.
                                            • Comments, such as -- and /*, are not supported.
                                            • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                              • load data
                                              • delete from
                                              • alter table
                                              • create table
                                              • drop table
                                              • into outfile
                                              +
                                            • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

                                            select id,name from sqoop.user;

                                            @@ -48,7 +48,7 @@

                                            Name of the table from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting the table or directly enter a table name.

                                            If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                            This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            NOTE:
                                            The table name can contain wildcard characters (*), which is used to export all tables whose names start with a certain prefix or end with a certain suffix. The number and types of fields in the tables must be the same. The examples are as follows:
                                            • table* indicates that all tables whose names starting with table are exported.
                                            • *table indicates that all tables whose names ending with table are exported.
                                            • *table* indicates that all tables whose names containing table are exported.
                                            @@ -75,7 +75,7 @@

                                            WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

                                            You can set a date macro variable to extract data generated on a specific date.

                                            -
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            +
                                            NOTE:

                                            If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                            DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                            @@ -94,7 +94,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0304.html b/docs/dataartsstudio/umn/dataartsstudio_01_0304.html index 421be3988..0a2967083 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0304.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0304.html @@ -1,8 +1,8 @@

                                            Adding Fields

                                            -

                                            Scenario

                                            • After job parameters are configured, field mapping needs to be configured. You can customize new fields by clicking on the Map Field page.
                                            • If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.
                                            • In other scenarios, CDM automatically maps fields of the source table and the destination table. You need to check whether the mapping and time format are correct. For example, check whether the source field type can be converted into the destination field type.
                                            -
                                            You can click on the Map Field page and select Add to customize a new field. This field is usually used to mark the database source to ensure the integrity of the data imported to the migration destination.
                                            Figure 1 Field mapping
                                            +

                                            Scenario

                                            • After job parameters are configured, field mapping needs to be configured. You can customize new fields by clicking on the Map Field page.
                                            • If files are migrated between FTP, SFTP, OBS, and HDFS and the migration source's File Format is set to Binary, files will be directly transferred, free from field mapping.
                                            • In other scenarios, CDM automatically maps fields of the source table and the destination table. You need to check whether the mapping and time format are correct. For example, check whether the source field type can be converted into the destination field type.
                                            +
                                            You can click on the Map Field page and select Add to customize a new field. This field is usually used to mark the database source to ensure the integrity of the data imported to the migration destination.
                                            Figure 1 Field mapping
                                            Currently, the following field types are supported:
                                            • Constant Parameter

                                              Constant parameters are fixed parameters and do not need to be reconfigured. For example, lable = friends is used to identify a constant value.

                                            • Variables

                                              You can use variables such as time macros, table name macros, and version macros to mark database source information. The variable syntax is ${variable}, where variable indicates a variable. For example, input_time = ${timestamp()} indicates the timestamp of the current time.

                                              @@ -10,7 +10,7 @@
                                            -

                                            Constraints

                                            • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
                                            • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
                                            • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datetime) so that they can be written.
                                            • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
                                            • Field mapping is not involved when the binary format is used to migrate files to files.
                                            • In the automatic table creation scenario, you need to manually add fields to the destination table in advance and then add fields to the field mapping.
                                            • After a field is added, its sample value is not displayed on the console. This does not affect the field value transmission. CDM directly writes the field value to the destination end.
                                            • If the field mapping is incorrect, you can adjust the field mapping by dragging fields or clicking to map fields in batches.
                                            • If the data is imported to DWS, you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following principles:
                                              1. Use the primary key as the distribution column.
                                              2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
                                              3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
                                              +

                                              Constraints

                                              • On the Map Field tab page, if CDM fails to obtain all columns by obtaining sample values (for example, when data is exported from HBase, CloudTable, or MongoDB, there is a high probability that CDM failed to obtain all columns), you can click and select Add a new field to add new fields to ensure that the data imported to the migration destination is complete.
                                              • When a relational database, Hive, DLI, or MRS Hudi is used as the migration source, sample values cannot be obtained.
                                              • When SQLServer is the destination, fields of the timestamp type cannot be written. You must change their type (for example, to datetime) so that they can be written.
                                              • Column names are displayed when the source of the migration job is OBS, CSV files are to be migrated, and parameter Extract first row as columns is set to Yes.
                                              • Field mapping is not involved when the binary format is used to migrate files to files.
                                              • In the automatic table creation scenario, you need to manually add fields to the destination table in advance and then add fields to the field mapping.
                                              • After a field is added, its sample value is not displayed on the console. This does not affect the field value transmission. CDM directly writes the field value to the destination end.
                                              • If the field mapping is incorrect, you can adjust the field mapping by dragging fields or clicking to map fields in batches.
                                              • If the data is imported to DWS, you need to select the distribution columns in the destination fields. You are advised to select the distribution columns according to the following principles:
                                                1. Use the primary key as the distribution column.
                                                2. If multiple data segments are combined as primary keys, specify all primary keys as the distribution column.
                                                3. In the scenario where no primary key is available, if no distribution column is selected, DWS uses the first column as the distribution column by default. As a result, data skew risks exist.
                                              • If a source field type is not supported, convert the field type to a type supported by CDM by referring to Converting Unsupported Data Types.
                                            @@ -20,3 +20,10 @@
                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0332.html b/docs/dataartsstudio/umn/dataartsstudio_01_0332.html index 5e556a8ca..10ecb1189 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0332.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0332.html @@ -49,7 +49,7 @@
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0350.html b/docs/dataartsstudio/umn/dataartsstudio_01_0350.html index add767b84..54ccf948d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0350.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0350.html @@ -1,18 +1,15 @@ - -

                                            Tutorials

                                            - -

                                            +

                                            Typical Scenarios for Using Management Center

                                            +

                                            -
                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0351.html b/docs/dataartsstudio/umn/dataartsstudio_01_0351.html index 1ab748222..443a6272c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0351.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0351.html @@ -1,18 +1,18 @@ -

                                            Creating an MRS Hive Connection

                                            +

                                            Creating a Connection Between DataArts Studio and an MRS Hive Data Lake

                                            This section describes how to create an MRS Hive connection between DataArts Studio and the data lake base.

                                            -

                                            Prerequisites

                                            • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                              • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                              • Before creating an MRS connection such as an MRS HBase and MRS Hive connection, ensure that you have created an MRS cluster and selected required components.
                                              -
                                            • The data lake to connect communicates with the DataArts Studio instance properly.
                                              • If the data lake is an on-premises database, a public network or a dedicated connection is required. Ensure that the host where the data source is located can access the public network and the port has been enabled in the firewall rule.
                                              • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the cloud service are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection.
                                                • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                +

                                                Prerequisites

                                                • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                  • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                  • Before creating an MRS connection such as an MRS HBase or MRS Hive connection, ensure that you have created an MRS cluster whose Kerberos encryption type is aes256-sha1,aes128-sha1, and that the cluster contains required components.
                                                  +
                                                • You have obtained the required agent (CDM cluster). If no CDM cluster is available, create one by referring to Creating a CDM Cluster. The CDM cluster can communicate with the data lake to be connected.
                                                  • If the data lake is an on-premises database, you need the Internet or Direct Connect. Ensure that the host where the data source is located and the CDM cluster can access the Internet, and the connection port has been enabled in the firewall rule.
                                                  • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                    • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service.
                                                    • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                    • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                  -
                                                • If the enterprise mode is used, pay attention to the following points:
                                                  In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                  • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a Data Connection.
                                                  • For serverless services (such as DLI), you can configure the mapping between data lake services in the production environment and those in the development environment through environment isolation in Management Center. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                  • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                  +
                                                • If the enterprise mode is used, pay attention to the following points:
                                                  In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                  • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a DataArts Studio Data Connection.
                                                  • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                  • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                  • Offline processing migration jobs are not supported in enterprise mode.

                                                  For example, if your data lake service is an MRS cluster, you need to prepare two MRS clusters with the same version, specifications, components, region, VPC, and subnet. If some configurations of an MRS cluster are modified, you also need to synchronize the modifications to the other MRS cluster.

                                                -

                                                Creating a Data Connection

                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                  Figure 1 Creating a data connection
                                                  +

                                                  Creating a Data Connection

                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                  2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                  3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                    Figure 1 Creating a data connection

                                                    -

                                                  4. On the Manage Data Connections page, click Create Data Connection. On the displayed page, select MRS Hive for Data Connection Type and set other parameters based on the descriptions in Table 1.

                                                    Figure 2 MRS Hive connection parameters
                                                    +

                                                  5. On the Manage Data Connections page, click Create Data Connection. On the displayed page, select MRS Hive for Data Connection Type and set other parameters based on the descriptions in Table 1.

                                                    Figure 2 MRS Hive connection parameters

                                                    @@ -28,10 +28,10 @@

                                            Yes

                                            MRS Hive is selected by default and cannot be changed.

                                            +

                                            MRS Hive is selected by default and cannot be changed.

                                            Data Connection Name

                                            +

                                            Name

                                            Yes

                                            Yes

                                            Select the modules for which this connection is available. The connection can be used in the selected modules.

                                            -

                                            All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                            +

                                            Select the modules for which this connection is available.

                                            Basic and Network Connectivity Configuration

                                            +

                                            Basic and Network Connectivity Configuration

                                            Connection Type

                                            Yes

                                            Connection type. Proxy connection is recommended.
                                            • Proxy connection: An agent (CDM cluster) is used to access MRS clusters. This method supports all versions of MRS clusters.
                                            • MRS API connection: MRS APIs are used to access MRS clusters. This method supports only MRS clusters of the 2.X or a later version.

                                              When you select MRS API connection, pay attention to the following restrictions:

                                              +
                                            Connection type. Proxy connection is recommended.
                                            • Proxy connection: An agent (CDM cluster) is used to access MRS clusters. This method supports all versions of MRS clusters.
                                            • MRS API connection: MRS APIs are used to access MRS clusters. This method supports only MRS clusters of the 2.X or a later version.

                                              When you select MRS API connection, pay attention to the following restrictions:

                                              1. In DataArts Factory, you cannot view or manage the databases, data tables, and fields of the connection in a visualized manner. If an MRS cluster of version 3.2.1 or later is connected, you can view rather than manage the databases, data tables, and fields of the connection in a visualized manner.
                                              2. When the SQL editor of DataArts Factory is used to run SQL statements, the execution results can be displayed only in logs.
                                            -
                                            NOTE:

                                            Select Proxy connection for Connection Type so that the DataArts Architecture, DataArts Quality, DataArts Catalog, and DataArts DataService components can use the MRS connection.

                                            +
                                            NOTE:

                                            Select Proxy connection for Connection Type so that the DataArts Architecture, DataArts Quality, DataArts Catalog, and DataArts DataService components can use the MRS connection.

                                            Yes

                                            This parameter is mandatory when Connection Type is set to Proxy connection.

                                            -
                                            Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                            • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                            • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                            +

                                            This parameter is mandatory when Connection Type is set to Proxy connection.

                                            +
                                            Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                            • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                            • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                            Yes

                                            This parameter is mandatory when Connection String Mode is selected for Manual.

                                            -

                                            Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.

                                            -

                                            You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                            -
                                            Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                            • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                            • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                            +

                                            This parameter is mandatory when Connection String Mode is selected for Manual.

                                            +
                                            Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            +
                                            +
                                            +

                                            You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                            +
                                            Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                            • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                            • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                            Yes

                                            This parameter is mandatory when MRS API connection is selected for Connection Type or Cluster Name Mode is selected for Manual.

                                            -

                                            MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                            -
                                            If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                            • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                            • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                            • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                            +

                                            This parameter is mandatory when MRS API connection is selected for Connection Type or Cluster Name Mode is selected for Manual.

                                            +
                                            The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                            NOTE:

                                            DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                            +
                                            +
                                            +
                                            If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                            • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                            • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                            • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                            +
                                            NOTE:

                                            If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                            +

                                            No

                                            This parameter is mandatory when Connection Type is set to Proxy connection.

                                            -

                                            KMS key used to encrypt and decrypt the authentication information for the data source

                                            +

                                            This parameter is mandatory when Connection Type is set to Proxy connection.

                                            +
                                            KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                            NOTE:
                                            • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                            • Only symmetric keys are supported. Asymmetric keys are not supported.
                                            +
                                            +

                                            Agent

                                            Yes

                                            This parameter is mandatory when Connection Type is set to Proxy connection.

                                            -

                                            MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                            -

                                            As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                            -
                                            NOTE:
                                            • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                            • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                            +

                                            This parameter is mandatory when Connection Type is set to Proxy connection.

                                            +

                                            MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                            +

                                            As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                            +
                                            NOTE:
                                            • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                            • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                              +

                                            Data Source Authentication and Other Function Configuration

                                            +

                                            Data Source Authentication and Other Function Configuration

                                            Authentication Method

                                            Yes

                                            This parameter is mandatory when Connection String Mode is selected for Manual.

                                            -
                                            Authentication method used for accessing MRS
                                            • SIMPLE: Select this for non-security mode.
                                            • KERBEROS: Select this for security mode.
                                            +

                                            This parameter is mandatory when Connection String Mode is selected for Manual.

                                            +
                                            It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                            • SIMPLE: for non-security mode
                                            • KERBEROS: for security mode

                                            Yes

                                            Human-machine user of the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                            -
                                            To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                            NOTE:
                                            • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                            • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                            • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                            • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                            +

                                            Human-machine user of the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                            +
                                            To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                            NOTE:
                                            • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                            • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                            • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                            • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.

                                            Yes

                                            The password for accessing the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection.

                                            +

                                            The password for accessing the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection.

                                            Enable ldap

                                            No

                                            This parameter is available when Connection Type is set to Proxy connection.

                                            +

                                            This parameter is available when Connection Type is set to Proxy connection.

                                            If LDAP authentication is enabled for an external LDAP server connected to MRS Hive, the LDAP username and password are required for authenticating the connection to MRS Hive. In this case, this option must be enabled. Otherwise, the connection will fail.

                                            Yes

                                            This parameter is mandatory when Enable ldap is enabled.

                                            +

                                            This parameter is mandatory when Enable ldap is enabled.

                                            Enter the username configured when LDAP authentication was enabled for MRS Hive.

                                            Yes

                                            This parameter is mandatory when Enable ldap is enabled.

                                            +

                                            This parameter is mandatory when Enable ldap is enabled.

                                            Enter the password configured when LDAP authentication was enabled for MRS Hive.

                                            OBS storage support

                                            +

                                            No

                                            +

                                            This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                            +

                                            The server must support OBS storage. When creating a Hive table, you can store the table in OBS.

                                            +

                                            Use Agency

                                            +

                                            No

                                            +

                                            This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                            +

                                            If you enable the agency function, you can create a data connection without having a permanent AK/SK and execute CDM jobs using the scheduling identity configured in DataArts Factory.

                                            +

                                            Public agency

                                            +

                                            No

                                            +

                                            This parameter is displayed when DataArts Migration is selected for Applicable Modules and Use Agency is enabled.

                                            +

                                            The agency is only used to check whether the connection agency function is normal. CDM jobs will be executed using the scheduling identity configured in DataArts Factory.

                                            +

                                            AK

                                            +

                                            N/A

                                            +

                                            This parameter is displayed when DataArts Migration is selected for Applicable Modules and OBS storage support is enabled.

                                            +

                                            AK and SK are used to log in to the OBS server.

                                            +

                                            You need to create an access key for the current account and obtain an AK/SK pair.

                                            +
                                            To obtain an access key, perform the following steps:
                                            1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                            2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 3.
                                              Figure 3 Clicking Create Access Key
                                              +
                                            3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                                              NOTE:
                                              • Only two access keys can be added for each user.
                                              • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                                              +
                                              +
                                            +
                                            +

                                            +

                                            SK

                                            +

                                            N/A

                                            +
                                            -

                                          6. Click Test to test connectivity of the data connection. If the test fails, the data connection fails to be created.
                                          7. After the test is successful, click OK to create the data connection.
                                          8. +

                                          9. Click Test to test connectivity of the data connection. If the test fails, the data connection fails to be created.
                                          10. After the test is successful, click Save to create the data connection.
                                          11. -

                                            Reference

                                            1. Why is no MRS Hive cluster displayed on the Create Data Connection page?
                                              Possible causes are as follows:
                                              • Hive/HBase components were not selected during MRS cluster creation.
                                              • The network between the CDM cluster and MRS cluster was disconnected when an MRS data connection is created.

                                                The CDM cluster functions as a network agent. MRS data connections that you are going to create need to communicate with CDM.

                                                +

                                                Reference

                                                1. Why is no MRS Hive cluster displayed on the Create Data Connection page?
                                                  Possible causes are as follows:
                                                  • Hive/HBase components were not selected during MRS cluster creation.
                                                  • The enterprise project selected during MRS cluster creation is different from that in the workspace.
                                                  • The network between the CDM cluster and MRS cluster was disconnected when an MRS data connection is created.

                                                    The CDM cluster functions as a network agent. MRS data connections that you are going to create need to communicate with CDM.

                                                2. Why does a Hive data connection fail to obtain information about databases or tables?

                                                  The possible cause is that the CDM cluster is stopped or a concurrency conflict occurs. You can switch to another agent to temporarily avoid this issue.

                                                  @@ -186,7 +238,14 @@
                                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0352.html b/docs/dataartsstudio/umn/dataartsstudio_01_0352.html index 1594a8d25..32b329e90 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0352.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0352.html @@ -1,18 +1,18 @@ -

                                                Creating a DWS Connection

                                                +

                                                Creating a Connection Between DataArts Studio and a GaussDB(DWS) Data Lake

                                                This section describes how to create a DWS connection between DataArts Studio and the data lake base.

                                                -

                                                Prerequisites

                                                • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                  • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                  • Before creating an MRS connection such as an MRS HBase and MRS Hive connection, ensure that you have created an MRS cluster and selected required components.
                                                  -
                                                • The data lake to connect communicates with the DataArts Studio instance properly.
                                                  • If the data lake is an on-premises database, a public network or a dedicated connection is required. Ensure that the host where the data source is located can access the public network and the port has been enabled in the firewall rule.
                                                  • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                    • If the CDM cluster in the DataArts Studio instance and the cloud service are in different regions, a public network or a dedicated connection is required.
                                                    • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                    • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                    +

                                                    Prerequisites

                                                    • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                      • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                      • Before creating an MRS connection such as an MRS HBase or MRS Hive connection, ensure that you have created an MRS cluster whose Kerberos encryption type is aes256-sha1,aes128-sha1, and that the cluster contains required components.
                                                      +
                                                    • You have obtained the required agent (CDM cluster). If no CDM cluster is available, create one by referring to Creating a CDM Cluster. The CDM cluster can communicate with the data lake to be connected.
                                                      • If the data lake is an on-premises database, you need the Internet or Direct Connect. Ensure that the host where the data source is located and the CDM cluster can access the Internet, and the connection port has been enabled in the firewall rule.
                                                      • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                        • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service.
                                                        • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                        • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                      -
                                                    • If the enterprise mode is used, pay attention to the following points:
                                                      In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                      • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a Data Connection.
                                                      • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                      • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                      +
                                                    • If the enterprise mode is used, pay attention to the following points:
                                                      In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                      • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a DataArts Studio Data Connection.
                                                      • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                      • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                      • Offline processing migration jobs are not supported in enterprise mode.

                                                      For example, if your data lake service is an MRS cluster, you need to prepare two MRS clusters with the same version, specifications, components, region, VPC, and subnet. If some configurations of an MRS cluster are modified, you also need to synchronize the modifications to the other MRS cluster.

                                                    -

                                                    Creating a Data Connection

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                    3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                      Figure 1 Creating a data connection
                                                      +

                                                      Creating a Data Connection

                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                      3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                        Figure 1 Creating a data connection

                                                        -

                                                      4. On the Manage Data Connections page, click Create Data Connection. On the displayed page, select DWS for Data Connection Type and set other parameters based on the descriptions in Table 1.

                                                        Figure 2 DWS connection parameters
                                                        +

                                                      5. On the Manage Data Connections page, click Create Data Connection. On the displayed page, select DWS for Data Connection Type and set other parameters based on the descriptions in Table 1.

                                                        Figure 2 DWS connection parameters

                                                        @@ -52,7 +52,6 @@

                                            Yes

                                            Select the modules for which this connection is available.

                                            -

                                            All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                            Basic and Network Connectivity Configuration

                                            @@ -62,7 +61,8 @@

                                            Yes

                                            DWS supports SSL encryption and certificate authentication for communication between the client and server. You can use SSL Connection to set the communication mode. If SSL Connection is enabled, only SSL encryption can be used. If SSL Connection is disabled, both modes can be used. This function is disabled by default.

                                            +
                                            DWS supports SSL encryption and certificate authentication for communication between the client and server. You can set this parameter based on whether SSL connection is mandatory on the server.
                                            • If this parameter is enabled, only SSL encryption can be used for communication.
                                            • If this parameter is disabled, both SSL encryption and certificate authentication can be used for communication.
                                            +

                                            Manual

                                            @@ -71,6 +71,8 @@

                                            Select either of the following modes:

                                            • Cluster Name Mode: Select an existing cluster.
                                            • Connection String Mode: Enter the IP address/domain name and port of the corresponding cluster and enable the communication between the connection's agent (CDM cluster) and the DWS cluster.
                                            +
                                            NOTE:

                                            DataArts Security does not support GaussDB(DWS) connections in connection string mode.

                                            +

                                            DWS Cluster Name

                                            @@ -86,6 +88,7 @@

                                            Yes

                                            This parameter is mandatory when Manual is set to Connection String Mode.

                                            +

                                            If you choose to manually enter an IP address or domain name, you must enter an internal IP address and a port that is accessible to the network segment of the resource group. Otherwise, the network is disconnected.

                                            This parameter indicates the address for accessing the cluster database through an internal network. Enter an IP address or domain name. The IP address or domain name is automatically generated during cluster creation. You can obtain them on the management console by performing the following operations:
                                            1. Log in to the GaussDB(DWS) console.
                                            2. In the left navigation pane, choose Instances.
                                            3. Click the name of an instance to enter the basic information page. In the Connection Information area, you can obtain the private IP address, domain name, and port number.

                                            Yes

                                            KMS key used to encrypt and decrypt the authentication information for the data source

                                            +
                                            KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                            NOTE:
                                            • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                            • Only symmetric keys are supported. Asymmetric keys are not supported.
                                            +
                                            +

                                            Agent

                                            Yes

                                            Data Warehouse Service (DWS) is not a fully managed service and thus cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating a DWS data connection. If no CDM cluster is available, create one first.

                                            -

                                            As a network proxy, the CDM cluster must be able to communicate with the DWS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the DWS cluster. The security group rule must also allow the CDM cluster communicate with the DWS cluster.

                                            +

                                            Data Warehouse Service (DWS) is not a fully managed service and thus cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating a DWS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                            +

                                            As a network proxy, the CDM cluster must be able to communicate with the DWS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the DWS cluster. The security group rule must also allow the CDM cluster communicate with the DWS cluster.

                                            NOTE:

                                            If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                            -

                                          12. Click Test to test connectivity of the data connection. If the test fails, the data connection fails to be created.
                                          13. After the test is successful, click OK to create the data connection.
                                          14. +

                                          15. Click Test to test connectivity of the data connection. If the test fails, the data connection fails to be created.
                                          16. After the test is successful, click Save to create the data connection.
                                          17. -

                                            Reference

                                            1. What should I do if the connection test fails when I enable the SSL connection during the creation of a DWS data connection?
                                              The failure may be caused by the rights separation function of the DWS cluster. On the DWS console, click the corresponding cluster, choose Security Settings, and disable Rights Separation.
                                              Figure 3 Disabling Rights Separation for the DWS cluster
                                              +

                                              Reference

                                              1. What should I do if the connection test fails when I enable the SSL connection during the creation of a DWS data connection?
                                                On the DWS console, click the corresponding cluster, choose Security Settings, and disable Rights Separation.
                                                Figure 3 Disabling Rights Separation for the DWS cluster
                                              2. Why does a DWS data connection fail to obtain information about databases or tables?

                                                The possible cause is that the CDM cluster is stopped or a concurrency conflict occurs. You can switch to another agent to temporarily avoid this issue.

                                              @@ -145,7 +150,14 @@
                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0353.html b/docs/dataartsstudio/umn/dataartsstudio_01_0353.html index b59a61398..c825835a1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0353.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0353.html @@ -1,20 +1,20 @@ -

                                              Creating a MySQL Connection

                                              +

                                              Creating a Connection Between DataArts Studio and a MySQL Database

                                              This section describes how to create a MySQL connection between DataArts Studio and the data lake base.

                                              -

                                              Prerequisites

                                              • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                • Before creating an MRS connection such as an MRS HBase and MRS Hive connection, ensure that you have created an MRS cluster and selected required components.
                                                -
                                              • The data lake to connect communicates with the DataArts Studio instance properly.
                                                • If the data lake is an on-premises database, a public network or a dedicated connection is required. Ensure that the host where the data source is located can access the public network and the port has been enabled in the firewall rule.
                                                • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                  • If the CDM cluster in the DataArts Studio instance and the cloud service are in different regions, a public network or a dedicated connection is required.
                                                  • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                  • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                  +

                                                  Prerequisites

                                                  • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                    • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                    • Before creating an MRS connection such as an MRS HBase or MRS Hive connection, ensure that you have created an MRS cluster whose Kerberos encryption type is aes256-sha1,aes128-sha1, and that the cluster contains required components.
                                                    +
                                                  • You have obtained the required agent (CDM cluster). If no CDM cluster is available, create one by referring to Creating a CDM Cluster. The CDM cluster can communicate with the data lake to be connected.
                                                    • If the data lake is an on-premises database, you need the Internet or Direct Connect. Ensure that the host where the data source is located and the CDM cluster can access the Internet, and the connection port has been enabled in the firewall rule.
                                                    • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                      • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service.
                                                      • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                      • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                    -
                                                  • If the enterprise mode is used, pay attention to the following points:
                                                    In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                    • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a Data Connection.
                                                    • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                    • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                    +
                                                  • If the enterprise mode is used, pay attention to the following points:
                                                    In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                    • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a DataArts Studio Data Connection.
                                                    • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                    • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                    • Offline processing migration jobs are not supported in enterprise mode.

                                                    For example, if your data lake service is an MRS cluster, you need to prepare two MRS clusters with the same version, specifications, components, region, VPC, and subnet. If some configurations of an MRS cluster are modified, you also need to synchronize the modifications to the other MRS cluster.

                                                  -

                                                  Creating a Data Connection

                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                  2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                  3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                    Figure 1 Creating a data connection
                                                    +

                                                    Creating a Data Connection

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                    3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                      Figure 1 Creating a data connection

                                                    4. On the Manage Data Connections page, click Create Data Connection. On the displayed page, select RDS for Data Connection Type and set other parameters based on the descriptions in Table 1.

                                                      • You are not advised to select MySQL (pending offline) for Data Connection Type. Instead, You are advised to select RDS.
                                                      • RDS data connections depend on OBS. If OBS is unavailable in the same region as DataArts Studio, RDS data connections are not supported.
                                                      -
                                                      Figure 2 RDS connection parameters
                                                      +
                                                      Figure 2 RDS connection parameters

                                                      @@ -54,7 +54,6 @@

                                            Yes

                                            Select the modules for which this connection is available.

                                            -

                                            All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                            Basic and Network Connectivity Configuration

                                            @@ -64,7 +63,8 @@

                                            Yes

                                            Address for accessing the relational database data source. The value can be an IP address or a domain name.

                                            +

                                            Address for accessing the relational database data source. The value can be an IP address or a domain name.

                                            +

                                            If you choose to manually enter an IP address or domain name, you must enter an internal IP address and a port that is accessible to the network segment of the resource group. Otherwise, the network is disconnected.

                                            • If the data source is RDS, you can obtain the address on the management console by performing the following operations:
                                              1. Log in to the management console of the corresponding cloud service using the account you have obtained.
                                              2. In the left navigation pane, choose Instances.
                                              3. Click the name of an instance to enter the basic information page. In the Connection Information area, you can obtain the private IP address, domain name, and port number.
                                            • If the data source is MySQL, PostgreSQL, or DM, you can obtain the access address from the database administrator.

                                            Cluster Mode

                                            +

                                            Yes

                                            +

                                            GaussDB cluster mode. This parameter is available when Driver Name is set to com.huawei.opengauss.jdbc.Driver.

                                            +
                                            • Primary/Standby
                                            • Distributed
                                            +

                                            KMS Key

                                            Yes

                                            KMS key used to encrypt and decrypt the authentication information for the data source

                                            +
                                            KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                            NOTE:
                                            • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                            • Only symmetric keys are supported. Asymmetric keys are not supported.
                                            +
                                            +

                                            Agent

                                            Yes

                                            RDS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an RDS data connection. If no CDM cluster is available, create one first.

                                            -

                                            As a network proxy, the CDM cluster must be able to communicate with RDS. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as RDS. The security group rule must also allow the CDM cluster to communicate with RDS.

                                            +

                                            RDS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an RDS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                            +

                                            As a network proxy, the CDM cluster must be able to communicate with RDS. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as RDS. The security group rule must also allow the CDM cluster to communicate with RDS.

                                            NOTE:

                                            If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                            SSL Encryption

                                            +

                                            No

                                            +

                                            Whether to enable SSL encrypted transmission.

                                            +

                                            Data Source Driver Configuration

                                            Yes

                                            The name of the driver. The following values are available:

                                            -
                                            • com.mysql.jdbc.Driver: Select this driver name for RDS for MySQL or MySQL.
                                            • org.postgresql.Driver: Select this driver name for RDS for PostgreSQL or PostgreSQL.
                                            • com.microsoft.sqlserver.jdbc.SQLServerDriver: Select this driver name for RDS for SQL Server.
                                            +
                                            • com.mysql.jdbc.Driver: Select this driver name for RDS for MySQL or MySQL.
                                            • org.postgresql.Driver: Select this driver name for RDS for PostgreSQL or PostgreSQL.
                                            • com.microsoft.sqlserver.jdbc.SQLServerDriver: Select this driver name for RDS for SQL Server.
                                            • com.huawei.opengauss.jdbc.Driver: Select this driver name for RDS for GaussDB.
                                            +

                                            Driver file source

                                            +

                                            Yes

                                            +

                                            Select the source of the driver file.

                                            Driver File Path

                                            @@ -111,7 +135,7 @@

                                            Yes

                                            It specifies the OBS path where the driver file is located. You need to download a .jar driver file from the corresponding official website and upload it to OBS.

                                            - +
                                            NOTE:
                                            • The OBS path of the driver file cannot contain Chinese characters.
                                            • To update the driver, you must restart the CDM cluster in DataArts Migration and then edit the data connection to upload the driver.
                                            -

                                          18. Click Test to test connectivity of the data connection. If the test fails, the data connection fails to be created.
                                          19. After the test is successful, click OK to create the data connection.
                                          +

                                        2. Click Test to test connectivity of the data connection. If the test fails, the data connection fails to be created.
                                        3. After the test is successful, click Save to create the data connection.

                                        Reference

                                        1. What Are the Precautions for Creating an RDS Data Connection?

                                          When creating an RDS data connection, you need to bind an agent provided by the CDM cluster. Currently, a version of the CDM cluster earlier than 1.8.6 is not supported.

                                        @@ -144,7 +168,14 @@
                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0387.html b/docs/dataartsstudio/umn/dataartsstudio_01_0387.html index 675d30272..0e0d0ea38 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0387.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0387.html @@ -25,8 +25,8 @@

                                      SQL Statement

                                      When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

                                      -
                                      NOTE:
                                      • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                      • With statements are not supported.
                                      • Comments, such as -- and /*, are not supported.
                                      • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                        • load data
                                        • delete from
                                        • alter table
                                        • create table
                                        • drop table
                                        • into outfile
                                        -
                                      +
                                      NOTE:
                                      • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                      • With statements are not supported.
                                      • Comments, such as -- and /*, are not supported.
                                      • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                        • load data
                                        • delete from
                                        • alter table
                                        • create table
                                        • drop table
                                        • into outfile
                                        +
                                      • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

                                      select id,name from sqoop.user;

                                      @@ -48,7 +48,7 @@

                                      Name of the table from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting the table or directly enter a table name.

                                      If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                      -
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      +
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      NOTE:
                                      The table name can contain wildcard characters (*), which is used to export all tables whose names start with a certain prefix or end with a certain suffix. The number and types of fields in the tables must be the same. The examples are as follows:
                                      • table* indicates that all tables whose names starting with table are exported.
                                      • *table indicates that all tables whose names ending with table are exported.
                                      • *table* indicates that all tables whose names containing table are exported.
                                      @@ -68,7 +68,7 @@

                                      WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

                                      You can set a date macro variable to extract data generated on a specific date.

                                      -
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      +
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                      @@ -134,7 +134,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0388.html b/docs/dataartsstudio/umn/dataartsstudio_01_0388.html index 688a8bcdd..18fbe9748 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0388.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0388.html @@ -25,8 +25,8 @@

                                      SQL Statement

                                      When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

                                      -
                                      NOTE:
                                      • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                      • With statements are not supported.
                                      • Comments, such as -- and /*, are not supported.
                                      • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                        • load data
                                        • delete from
                                        • alter table
                                        • create table
                                        • drop table
                                        • into outfile
                                        -
                                      +
                                      NOTE:
                                      • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                      • With statements are not supported.
                                      • Comments, such as -- and /*, are not supported.
                                      • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                        • load data
                                        • delete from
                                        • alter table
                                        • create table
                                        • drop table
                                        • into outfile
                                        +
                                      • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

                                      select id,name from sqoop.user;

                                      @@ -48,7 +48,7 @@

                                      Name of the table from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting the table or directly enter a table name.

                                      If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                      This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                      -
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      +
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      NOTE:
                                      The table name can contain wildcard characters (*), which is used to export all tables whose names start with a certain prefix or end with a certain suffix. The number and types of fields in the tables must be the same. The examples are as follows:
                                      • table* indicates that all tables whose names starting with table are exported.
                                      • *table indicates that all tables whose names ending with table are exported.
                                      • *table* indicates that all tables whose names containing table are exported.
                                      @@ -64,7 +64,7 @@

                                      WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

                                      You can set a date macro variable to extract data generated on a specific date.

                                      -
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      +
                                      NOTE:

                                      If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                      DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                      @@ -86,7 +86,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0401.html b/docs/dataartsstudio/umn/dataartsstudio_01_0401.html index 1257618f1..ad9010396 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0401.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0401.html @@ -4,7 +4,7 @@

                                      DataArts Factory is a one-stop big data collaborative development platform that provides fully managed big data scheduling capabilities. It manages various big data services, making big data more accessible than ever before and helping you effortlessly build big data processing centers.

                                      DataArts Factory used to be Data Lake Factory (DLF). Therefore, in this document, both Data Lake Factory and DLF can be used to refer to DataArts Factory.

                                      Introduction to DataArts Factory

                                      DataArts Factory enables a variety of operations such as data management, script development, job development, job scheduling, and monitoring, facilitating data analysis and processing.

                                      -
                                      Figure 1 DataArts Factory architecture
                                      +
                                      Figure 1 DataArts Factory architecture

                                      Main Functions

                                      - + + + +
                                      Table 1 Main functions of DataArts Factory

                                      Function

                                      @@ -59,3 +59,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0402.html b/docs/dataartsstudio/umn/dataartsstudio_01_0402.html index 0a530d98d..1896d7567 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0402.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0402.html @@ -1,11 +1,13 @@

                                      Data Management Process

                                      -
                                      The data management function helps you quickly establish data models and provides you with data entities for script and job development. With data management, you can:
                                      • Manage multiple types of data lakes, such as DWS, DLI, and MRS Hive.
                                      • Use the GUI and DDL to manage database tables. If an MRS API connection is used, you cannot view or manage the databases, data tables, and fields of the connection in a visualized manner.
                                      • Click to view the databases, data tables, and fields in the data connection directory tree. The directory tree is only available for DWS SQL, DLI SQL, and Hive connections using an agent.
                                      -
                                      -

                                      If you have created a data connection, a database, and a data table, you can skip this section and go to Script Development or Job Development.

                                      +
                                      The data management function helps you quickly establish data models and provides you with data entities for script and job development. With data management, you can:
                                      • Manage multiple types of data lakes, such as GaussDB(DWS), DLI and MRS Hive.
                                      • Use the GUI and DDL to manage database tables.

                                        If an MRS API connection is used, you cannot view or manage the databases, data tables, and fields of the connection in a visualized manner.

                                        -
                                        The following figure shows the process for using the data management function.
                                        Figure 1 Data management process
                                        +
                                      • Click to view the databases, data tables, and fields in the data connection directory tree. The directory tree is only available for DWS SQL, DLI SQL and MRS Hive SQL connections using an agent.
                                      +
                                      +

                                      If you have created a data connection and a corresponding database and data table before using DataArts Factory, you can skip data management operations and directly go to Script Development or Job Development.

                                      +
                                      +
                                      The following figure shows the process for using the data management function.
                                      Figure 1 Data management process
                                      1. Create a data connection to connect to a data lake base service. For details, see Creating a Data Connection.
                                      2. Create a database based on the service type. For details, see Creating a Database.
                                      3. If the connection type is DWS, create a database schema and a table. If the connection type is not DWS, create a table. For details, see (Optional) Creating a Database Schema.
                                      4. Create a table. For details, see Creating a Table.
                                      @@ -15,3 +17,10 @@
                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0404.html b/docs/dataartsstudio/umn/dataartsstudio_01_0404.html index 0daf2ad79..7b0f4095d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0404.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0404.html @@ -1,12 +1,12 @@

                                      Creating a Data Connection

                                      -

                                      After a data connection is created, you can perform data operations on DataArts Factory, for example, managing databases, namespaces, database schema, and tables.

                                      +

                                      After creating a data connection, you can perform data operations on DataArts Factory, for example, managing databases, namespaces, database schema, and tables.

                                      With one data connection, you can run multiple jobs and develop multiple scripts. If the connection information saved in the data connection changes, you only need to modify the corresponding information in Connection Management.

                                      -

                                      Creating a Data Connection

                                      The data connection of DataArts Factory is created based on the data connection of Management Center. For details about how to create a data connection, see Managing Data Connections.

                                      +

                                      Creating a Data Connection

                                      The data connection of DataArts Factory is created based on the data connection of Management Center. For details about how to create a data connection, see Configuring DataArts Studio Data Connection Parameters.

                                      Viewing Connection References

                                      To view the references of a connection, perform the following steps:

                                      -
                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                      3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                      4. Click to display the connection list.
                                      5. Right-click a connection in the list and select View Reference.
                                      6. In the displayed Reference List dialog box, view the references of the connection.
                                        Figure 1 Reference List
                                        +
                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                        3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                        4. Click to display the connection list.
                                        5. Right-click a connection in the list and select View Reference.
                                        6. In the displayed Reference List dialog box, view the jobs or scripts that use the connection.
                                          Figure 1 Reference List
                                      @@ -16,3 +16,10 @@
                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0405.html b/docs/dataartsstudio/umn/dataartsstudio_01_0405.html index 5d05f9264..3ff957fd7 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0405.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0405.html @@ -4,9 +4,9 @@

                                      After creating a data connection, you can create a database on the console or using a SQL script.

                                      • (Recommended) Console: You can directly create a database on the DataArts Studio DataArts Factory console with no code.
                                      • SQL script: You can also develop and execute a SQL script for creating a database in the SQL editor of DataArts Studio's DataArts Factory module or a data lake product, and then use the script to create a database.

                                      This section describes how to create a database on the DataArts Factory console.

                                      -

                                      Prerequisites

                                      • You have already enabled the corresponding cloud services.
                                      • A data connection has been created. For details, see Creating a Data Connection.
                                      • MRS API connections cannot be used to manage databases in a visualized mode. You are advised to create a database using SQL scripts.
                                      • Before deleting a database, ensure that the database is not in use and is not associated with any data tables.
                                      +

                                      Prerequisites

                                      • You have already enabled the corresponding cloud services. for example, the MRS service.
                                      • A data connection has been created. For details, see Creating a Data Connection.
                                      • MRS API connections cannot be used to manage databases in a visualized mode. You are advised to create a database using SQL scripts.
                                      • Before deleting a database, ensure that the database is not in use and is not associated with any data tables.
                                      -

                                      Creating a Database on the DataArts Factory Console

                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                      3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                      4. In the script development menu, click . Right-click the data connection for which you want to create a database, and choose Create Database from the shortcut menu. Set the parameters based on Table 1. +

                                        Creating a Database on the DataArts Factory Console

                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                        3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                        4. In the script development menu, click . Right-click the data connection for which you want to create a database, and choose Create Database from the shortcut menu. Set the parameters based on Table 1.
                                          + + + +
                                          Table 1 Creating a database

                                          Parameter

                                          Mandatory

                                          @@ -36,7 +36,7 @@
                                        5. Click OK.
                                        6. -

                                          Related Operations

                                          • Modify a database: In the script development menu, click . Expand a data connection, right-click a database name, select Edit, and modify the database information.
                                          • Delete a database: In the script development menu, click . Expand a data connection, right-click a database name, select Delete, and click OK in the displayed dialog box.

                                            Deleted databases cannot be recovered. Exercise caution when performing this operation.

                                            +

                                            Related Operations

                                            • Modify a database: In the script development menu, click . Expand a data connection, right-click a database name, select Edit, and modify the database information.
                                            • Delete a database: In the script development menu, click . Expand a data connection, right-click a database name, select Delete, and click OK in the displayed dialog box.

                                              Deleted databases cannot be recovered. Exercise caution when performing this operation.

                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0408.html b/docs/dataartsstudio/umn/dataartsstudio_01_0408.html index ab393a4cc..41f2264dd 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0408.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0408.html @@ -24,6 +24,8 @@
                                          • +

                                          If you select this option, the node will not be executed, and a success message will be returned.

                                          Task Groups

                                          +

                                          No

                                          +

                                          Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                          +
                                          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0461.html b/docs/dataartsstudio/umn/dataartsstudio_01_0461.html index 572cfe262..cc49dbce9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0461.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0461.html @@ -26,7 +26,7 @@

                                      Yes

                                      Click to edit the source and destination data to be transformed.

                                      +

                                      Click to edit the source and destination data to be transformed.

                                      The supported source data types are DLI, OBS and MySQL.

                                      • When the source data type is DLI, the supported destination data types are DWS, GES, CSS, OBS, and DLI.
                                      • When the source data type is MySQL, the supported destination data type is MySQL.
                                      • When the source data type is OBS, the supported destination data can be of the DLI type and the DWS type.
                                      NOTICE:
                                      • Data transformation from DLI to DWS:

                                        Before importing data from DataArts Factory to DWS, ensure that a DWS data connection and a table have been created.

                                        @@ -68,7 +68,7 @@

                                      Yes

                                      Whether to re-execute a node if it fails to be executed. Possible values:

                                      -
                                      • Yes: The node will be re-executed, and the following parameters must be configured:
                                        • Retry upon Timeout
                                        • Maximum Retries
                                        • Retry Interval (seconds)
                                        +
                                        • Yes: The node will be re-executed, and the following parameters must be configured:
                                          • Retry upon Timeout
                                          • Maximum Retries
                                          • Retry Interval (seconds)
                                        • No: The node will not be re-executed. This is the default setting.
                                          NOTE:

                                          If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                          If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                          Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                          @@ -91,6 +91,13 @@

                                      If you select this option, the node will not be executed, and a success message will be returned.

                                      Task Groups

                                      +

                                      No

                                      +

                                      Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                      +
                                      @@ -121,17 +128,17 @@

                                      Modify

                                      Click to modify the parameter settings. After the modification, save the settings.

                                      +

                                      Click to modify the parameter settings. After the modification, save the settings.

                                      Delete

                                      Click to delete the parameter settings.

                                      +

                                      Click to delete the parameter settings.

                                      View Details

                                      Click to view details about the table created based on the input lineage.

                                      +

                                      Click to view details about the table created based on the input lineage.

                                      Output

                                      @@ -154,17 +161,17 @@

                                      Modify

                                      Click to modify the parameter settings. After the modification, save the settings.

                                      +

                                      Click to modify the parameter settings. After the modification, save the settings.

                                      Delete

                                      Click to delete the parameter settings.

                                      +

                                      Click to delete the parameter settings.

                                      View Details

                                      Click to view details about the table created based on the output lineage.

                                      +

                                      Click to view details about the table created based on the output lineage.

                                      Yes

                                      Whether to re-execute a node if it fails to be executed. Possible values:

                                      -
                                      • Yes: The node will be re-executed, and the following parameters must be configured:
                                        • Retry upon Timeout
                                        • Maximum Retries
                                        • Retry Interval (seconds)
                                        +
                                        • Yes: The node will be re-executed, and the following parameters must be configured:
                                          • Retry upon Timeout
                                          • Maximum Retries
                                          • Retry Interval (seconds)
                                        • No: The node will not be re-executed. This is the default setting.
                                          NOTE:

                                          If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                          If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                          Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                          @@ -79,6 +79,13 @@

                                      If you select this option, the node will not be executed, and a success message will be returned.

                                      Task Groups

                                      +

                                      No

                                      +

                                      Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                      +
                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0463.html b/docs/dataartsstudio/umn/dataartsstudio_01_0463.html index 88bfcbcc0..724e49aef 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0463.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0463.html @@ -55,7 +55,7 @@

                                  Yes

                                  Whether to re-execute a node if it fails to be executed. Possible values:

                                  -
                                  • Yes: The node will be re-executed, and the following parameters must be configured:
                                    • Retry upon Timeout
                                    • Maximum Retries
                                    • Retry Interval (seconds)
                                    +
                                    • Yes: The node will be re-executed, and the following parameters must be configured:
                                      • Retry upon Timeout
                                      • Maximum Retries
                                      • Retry Interval (seconds)
                                    • No: The node will not be re-executed. This is the default setting.
                                      NOTE:

                                      If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                      If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                      Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                      @@ -78,6 +78,13 @@

                                  If you select this option, the node will not be executed, and a success message will be returned.

                                  Task Groups

                                  +

                                  No

                                  +

                                  Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                  +
                                  diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0464.html b/docs/dataartsstudio/umn/dataartsstudio_01_0464.html index 44482694e..26f82603f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0464.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0464.html @@ -77,7 +77,7 @@

                                  Yes

                                  Whether to re-execute a node if it fails to be executed. Possible values:

                                  -
                                  • Yes: The node will be re-executed, and the following parameters must be configured:
                                    • Retry upon Timeout
                                    • Maximum Retries
                                    • Retry Interval (seconds)
                                    +
                                    • Yes: The node will be re-executed, and the following parameters must be configured:
                                      • Retry upon Timeout
                                      • Maximum Retries
                                      • Retry Interval (seconds)
                                    • No: The node will not be re-executed. This is the default setting.
                                      NOTE:

                                      If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                      If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                      Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                      @@ -100,6 +100,13 @@

                                  If you select this option, the node will not be executed, and a success message will be returned.

                                  Task Groups

                                  +

                                  No

                                  +

                                  Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                  +
                                  @@ -130,17 +137,17 @@

                              Modify

                              Click to modify the parameter settings. After the modification, save the settings.

                              +

                              Click to modify the parameter settings. After the modification, save the settings.

                              Delete

                              Click to delete the parameter settings.

                              +

                              Click to delete the parameter settings.

                              View Details

                              Click to view details about the table created based on the input lineage.

                              +

                              Click to view details about the table created based on the input lineage.

                              Output

                              @@ -163,17 +170,17 @@

                              Modify

                              Click to modify the parameter settings. After the modification, save the settings.

                              +

                              Click to modify the parameter settings. After the modification, save the settings.

                              Delete

                              Click to delete the parameter settings.

                              +

                              Click to delete the parameter settings.

                              View Details

                              Click to view details about the table created based on the output lineage.

                              +

                              Click to view details about the table created based on the output lineage.

                              If you select this option, the node will not be executed, and a success message will be returned.

                              Task Groups

                              +

                              No

                              +

                              Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0467.html b/docs/dataartsstudio/umn/dataartsstudio_01_0467.html index 5378e0937..58df7e2fc 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0467.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0467.html @@ -90,6 +90,13 @@
                            15. If you select this option, the node will not be executed, and a success message will be returned.

                              Task Groups

                              +

                              No

                              +

                              Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0468.html b/docs/dataartsstudio/umn/dataartsstudio_01_0468.html index 793882355..acc306645 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0468.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0468.html @@ -64,7 +64,7 @@ }

                              In the preceding information, message_template_name indicates the template name, and tags indicates all tags in the template.

                            16. -

                              For details about how to configure SMN, see section Publishing a Message/ Introduction of the Simple Message Notification User Guide.

                              +

                              For details about how to configure SMN, see section the Simple Message Notification User Guide.

                              Yes

                              Whether to re-execute a node if it fails to be executed. Possible values:

                              -
                              • Yes: The node will be re-executed, and the following parameters must be configured:
                                • Retry upon Timeout
                                • Maximum Retries
                                • Retry Interval (seconds)
                                +
                                • Yes: The node will be re-executed, and the following parameters must be configured:
                                  • Retry upon Timeout
                                  • Maximum Retries
                                  • Retry Interval (seconds)
                                • No: The node will not be re-executed. This is the default setting.
                                  NOTE:

                                  If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                  If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                  Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                  @@ -115,6 +115,13 @@

                              If you select this option, the node will not be executed, and a success message will be returned.

                              Task Groups

                              +

                              No

                              +

                              Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0469.html b/docs/dataartsstudio/umn/dataartsstudio_01_0469.html index 7e08feaf3..58b41b543 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0469.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0469.html @@ -2,7 +2,7 @@

                              Dummy

                              Functions

                              The Dummy node is empty and does not perform any operations. It is used to simplify the complex connection relationships of nodes. Figure 1 shows an example.

                              -
                              Figure 1 Connection modes
                              +
                              Figure 1 Connection modes

                              Parameters

                              Table 1 describes the parameter of Dummy nodes.

                              @@ -32,3 +32,10 @@
                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0470.html b/docs/dataartsstudio/umn/dataartsstudio_01_0470.html index d319737d4..7594cdbef 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0470.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0470.html @@ -3,7 +3,7 @@

                              Setting Up Scheduling for a Job

                              This section describes how to set up scheduling for an orchestrated job.

                              -

                              Prerequisites

                              +

                              Prerequisites

                              Constraints

                              • Set an appropriate value for this parameter. A maximum of five instances can be concurrently executed in a job. If the start time of a job instance is later than the configured job execution time, the job instances in the subsequent batch will be queued. As a result, the job execution costs a longer time than expected. For CDM and ETL jobs, the recurrence must be at least 5 minutes. In addition, the recurrence should be adjusted based on the data volume of the job table and the update frequency of the source table.
                              • If you use DataArts Studio DataArts Factory to schedule a CDM migration job and configure a scheduled task for the job in DataArts Migration, both configurations take effect. To ensure unified service logic and avoid scheduling conflicts, enable job scheduling in DataArts Factory and do not configure a scheduled task for the job in DataArts Migration.
                              @@ -18,10 +18,13 @@
                            17. Scheduling Type

                              Scheduling type of the job. Available options include:

                              -
                              • Run once: You need to manually execute the job.
                              • Run periodically: The job is executed periodically. For details about the parameters, see Table 2.
                                NOTE:

                                For jobs that are periodically scheduled, you can select Manual confirmation. After that, job instances on the Monitor Instance page are in waiting confirmation state. When you click Execute, the jobs are in waiting execution state. When you rerun instances, they are in waiting confirmation state. When you click Execute, the instances are in waiting execution state. In PatchData scenarios, PatchData job instances are in waiting confirmation state on the Monitor PatchData page. When you click Execute on the Monitor Instance page, PatchData job instances are in waiting execution state. On the Batch Jobs page, job instances are in waiting confirmation state. When you click Execute, the jobs are in waiting execution state.

                                -

                                During job export, if requireManualConfirmBeforeExecute is set to true, Manual confirmation is selected by default after job import. If requireManualConfirmBeforeExecute is set to false, Manual confirmation is not selected by default.

                                +

                              Scheduling type of the job. Available options include:

                              +
                              • Run once: You need to manually execute the job.
                              • Run periodically: The job is executed periodically. For details about the parameters, see Table 2.
                                • Manual confirmation: If this option is selected, the job instance can be executed only after manual confirmation. If manual confirmation is not performed, the job instance cannot be executed.
                                  NOTE:

                                  In job instance execution scenarios, job instances are in waiting confirmation state on the Monitor Instance page. When you click Execute, the job instances are in waiting execution state.

                                  +

                                  When you rerun instances, they are in waiting confirmation state. When you click Execute, the instances are in waiting execution state.

                                  +

                                  In PatchData scenarios, PatchData job instances are in waiting confirmation state on the Monitor PatchData page. When you click Execute on the Monitor Instance page, PatchData job instances are in waiting execution state.

                                  +

                                  In batch job monitoring scenarios, job instances are in waiting confirmation state on the Batch Jobs page. When you click Execute, the job instances are in waiting execution state.

                                  +
                              • Event-based: The job will be executed when certain external conditions are met. For details about the parameters, see Table 3.

                              Select a configured task group. For details, see Configuring Task Groups.

                              Do not select is selected by default.

                              -

                              After a task group is configured, you can control the number of concurrent nodes in the current workspace in a fine-grained manner. For example, if a job contains multiple nodes or patch data, you can control the number of concurrent nodes in the current workspace.

                              -

                              Example 1: The maximum number of concurrent tasks in the task group is set to 2, and a job has five nodes. When the job runs, only two nodes are running and the other nodes are waiting to run.

                              +

                              If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +

                              Example 1: The maximum number of concurrent tasks in the task group is set to 2, and a job has five nodes. When the job runs, only two nodes are running and the other nodes are waiting.

                              Example 2: The maximum number of concurrent tasks in the task group is set to 2, and the number of concurrent periods for a PatchData job is set to 5. When the PatchData job runs, two PatchData job instances are running, and the other job instances are waiting to run. The waiting instances can be delivered normally after a period of time.

                              +

                              Example 3: If the same task group is configured for multiple jobs, and the maximum number of concurrent tasks in the task group is set to 2, only two jobs are running and the other jobs are waiting. If the same task group is configured for multiple job nodes, the maximum number of concurrent tasks in the task group is set to 2, and there are five job nodes in total, two nodes are running and the other nodes are waiting.

                              +
                              NOTE:

                              For a pipeline job, you can configure a task group for each node or for the job. A task group configured for a node is prior to one configured for the job.

                              +

                              The frequency at which the scheduling task is executed, which can be:

                              Set an appropriate value for this parameter. A maximum of five instances can be concurrently executed in a job. If the start time of a job instance is later than the configured job execution time, the job instances in the subsequent batch will be queued. As a result, the job execution costs a longer time than expected. For CDM and ETL jobs, the recurrence must be at least 5 minutes. In addition, the recurrence should be adjusted based on the data volume of the job table and the update frequency of the source table.

                              You can modify the scheduling period of a running job.

                              -
                              • Minutes: The job starts at the top of the hour. The interval is accurate to minute. After the scheduling ends at the end time of the current day, the scheduling automatically starts on the next day.
                              • Hours: You can select Interval Hour, indicating that the job starts at a specified time point and that the interval is accurate to hour. After the scheduling ends at the end time of the current day, the scheduling automatically starts on the next day. You can also select Discrete Hour and specify any hour in a day to schedule the job.
                              • Every day: The job starts at a specified time on a day. The scheduling period is one day.
                              • Every week: You can select a specified time point of one or more days in a week.
                              • Every month: You can select a specified time point of one or more days in a month. You can select the last day of each month.
                              +
                              • Minutes: The job starts at the top of the hour. The interval is accurate to minute. After the scheduling ends at the end time of the current day, the scheduling automatically starts on the next day.
                                NOTE:

                                If you select Minutes for Scheduling Frequency, the job cannot be scheduled based on the configured interval, that is, the job cannot be executed at a fixed frequency across hours. For example:

                                +
                                • A scheduling policy is configured at 14:20 on June 19, 2024. According to the policy, the scheduling starts at 00:30 and ends at 23:59, at an interval of 30 minutes. The job is actually scheduled at 14:30:00, 15:30:00, 16:30:00, 17:30:00, 18:30:00, and more on June 19, 2024.
                                • A scheduling policy is configured at 14:20 on June 19, 2024. According to the policy, the scheduling starts at 00:00 and ends at 23:59, at an interval of 50 minutes. The job is actually scheduled at 14:50:00, 15:00:00, 15:50:00, 16:00:00, 16:50:00, 17:00:00, 17:50:00, and more on June 19, 2024.
                                +
                                +
                              • Hours: You can select Interval Hour, indicating that the job starts at a specified time point and that the interval is accurate to hour. After the scheduling ends at the end time of the current day, the scheduling automatically starts on the next day. You can also select Discrete Hour and specify any hour in a day to schedule the job.
                              • Every day: The job starts at a specified time on a day. The scheduling period is one day.
                              • Every week: You can select a specified time point of one or more days in a week.
                              • Every month: You can select a specified time point of one or more days in a month. In addition, you can select Last day of each month.
                              +
                              NOTE:

                              DataArts Studio does not support concurrent running of PatchData instances and periodic job instances of underlying services (such as CDM and DLI). To prevent PatchData instances from affecting periodic job instances and avoid exceptions, ensure that they do not run at the same time.

                              +

                              Scheduling Calendar

                              @@ -76,24 +87,24 @@
                              • OBS File: An EL expression is supported.
                              • Listening Interval: Set a value ranging from 1 to 60, in minutes.
                              • Timeout: Set a value ranging from 1 to 1440, in minutes.

                              Dependency Job

                              +

                              Dependency job

                              You can select jobs that are executed periodically in different workspaces as dependency jobs. The current job starts only after the dependency jobs are executed. You can click Parse Dependency to automatically identify job dependencies.

                              +

                              You can select jobs that are executed periodically in different workspaces as dependency jobs. The current job starts only after the dependency jobs are executed. You can click Parse Dependency to automatically identify job dependencies.

                              NOTE:

                              For details about job dependency rules across workspaces, see Job Dependency Rule.

                              Currently, DataArts Factory supports two types of job dependency policies, that is, dependency between jobs whose scheduling periods are traditional periods and dependency between jobs whose scheduling periods are natural periods. You can select either of them. The scheduling periods for new DataArts Studio instances are natural periods.

                              -
                              Figure 1 Dependency between jobs whose scheduling periods are traditional periods
                              -
                              Figure 2 Dependency between jobs whose scheduling periods are natural periods
                              +
                              Figure 1 Dependency between jobs whose scheduling periods are traditional periods
                              +
                              Figure 2 Dependency between jobs whose scheduling periods are natural periods

                              Policy for Current job If Dependency job Fails

                              Policy for processing the current job when one or more instances of its dependency job fail to be executed in its period.

                              -
                              • Pending

                                Waits to execute the current job, which affects the execution of subsequent jobs. You can force the dependency job to be executed successfully.

                                +

                              Policy for processing the current job when one or more instances of its dependency job fail to be executed in its period.

                              +
                              • Pending

                                Waits to execute the current job, which affects the execution of subsequent jobs. You can force the dependency job to be executed successfully.

                              • Continue

                                Continues to execute the current job.

                                -
                              • Cancel

                                Cancels the current job. Its status becomes Canceled.

                                +
                              • Cancel

                                Cancels the current job. Its status becomes Canceled.

                              -
                              For example, the recurrence of the current job is 1 hour and that of its dependency jobs is 5 minutes.
                              • If the value of this parameter is set to Cancel, the current job will be canceled as long as one of the 12 instances of its dependency job fails.
                              • If the value of this parameter is set to Continue, the current job will be executed after the 12 instances of its dependency job are executed.
                                NOTE:

                                You can set this parameter for multiple jobs in a batch. For details, see Configuring a Default Item. This parameter takes effect only for new jobs.

                                +
                                For example, the recurrence of the current job is 1 hour and that of its dependency jobs is 5 minutes.
                                • If the value of this parameter is set to Cancel, the current job will be canceled as long as one of the 12 instances of its dependency job fails.
                                • If the value of this parameter is set to Continue, the current job will be executed after the 12 instances of its dependency job are executed.
                                  NOTE:

                                  You can set this parameter for multiple jobs in a batch. For details, see Configuring a Default Item. This parameter takes effect only for new jobs.

                                @@ -101,20 +112,27 @@

                              Run After Dependency job Ends

                              If a job depends on other jobs, the job is executed only after its dependency job instances are executed within a specified time range. If the dependency job instances are not successfully executed, the current job is in waiting state.

                              +

                              If a job depends on other jobs, the job is executed only after its dependency job instances are executed within a specified time range. If the dependency job instances are not successfully executed, the current job is in waiting state.

                              If you select this option, the system checks whether all job instances in the previous cycle have been executed before executing the current job.

                              When configuring job dependencies, you can filter dependent jobs based on whether they are being scheduled.

                              +

                              Dependency Job

                              When configuring job dependencies, you can filter dependent jobs based on whether they are being scheduled. This prevents downstream job failures caused by upstream dependent jobs not being scheduled.

                              • All jobs
                              • Running jobs

                              Dependency Cycle

                              +
                              • Same Cycle
                              • Previous N Cycle. N range is from 1 to 30.
                                NOTE:
                                • If a daily job depends on a job scheduled by interval hour, the dependency rule can be All instances, Any instance, Last instance, or Default. Default indicates that the previous scheduling dependency rule remains unchanged.
                                • If a daily job depends on a job scheduled by discrete hour, the dependency rule can be All instances, Any instance, Last instance, or Default. Default indicates that the previous scheduling dependency rule remains unchanged.
                                • The dependencies between jobs using other scheduling periods remain unchanged, and the dependency rule is Default.
                                +
                                +
                              +

                              Cross-Cycle Dependency

                              Dependency between job instances

                              -
                              • Independent on the previous schedule cycle: You can set Concurrency to set the number of job instances that are concurrently executed. If you set it to 1, a batch is executed only after the previous batch is executed (the execution is successful, cancelled, or failed).
                              • Self-dependent (The job can be rescheduled only after it is executed in the current schedule cycle. Before that, the job is in Waiting state.)
                              • Skip waiting instances and run the latest instance: Skipped job instances will be canceled and not executed. If the execution of a job instance takes a long time, multiple subsequent job instances may be skipped. However, if these job instances need to be executed, skipping them may cause service logic errors. For example, if partitioned tables are required but redundant job instances are skipped, some partitioned tables may go missing. Exercise caution when selecting this option.
                                NOTE:
                                • Skip waiting instances and run the latest instance is only supported for jobs scheduled by minute or hour.
                                • If the number of concurrent jobs is small and no instance has been generated, blocked instances will not be skipped.
                                • If a job with a shorter period depends on a job with a longer period, some instances may not be skipped and still be executed.
                                +
                                • Independent on the previous schedule cycle: You can set Concurrency to set the number of job instances that are concurrently executed. If you set it to 1, a batch is executed only after the previous batch is executed (the execution is successful, cancelled, or failed).
                                • Self-dependent: The job can be rescheduled only after it is executed in the current schedule cycle. Before that, the job is in Waiting state.
                                • Skip waiting instances and run the latest instance: Skipped job instances will be canceled and not executed. If the execution of a job instance takes a long time, multiple subsequent job instances may be skipped. However, if these job instances need to be executed, skipping them may cause service logic errors. For example, if partitioned tables are required but redundant job instances are skipped, some partitioned tables may go missing. Exercise caution when selecting this option.
                                  NOTE:
                                  • Skip waiting instances and run the latest instance is only supported for jobs scheduled by minute or hour.
                                  • If the number of concurrent jobs is small and no instance has been generated, blocked instances will not be skipped.
                                  • If a job with a shorter period depends on a job with a longer period, some instances may not be skipped and still be executed.

                              Enable Dry Run

                              +

                              If you select this option, the job will not be executed, and a success message will be returned.

                              +

                              Task Groups

                              +

                              Select a configured task group. For details, see Configuring Task Groups.

                              +

                              Do not select is selected by default.

                              +

                              If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              NOTE:

                              For a pipeline job, you can configure a task group for each node or for the job. A task group configured for a node is prior to one configured for the job.

                              +
                              +
                              @@ -141,6 +173,20 @@
                              • KAFKA

                              Enable Dry Run

                              +

                              If you select this option, the job will not be executed, and a success message will be returned.

                              +

                              Task Groups

                              +

                              Select a configured task group. For details, see Configuring Task Groups.

                              +

                              Do not select is selected by default.

                              +

                              If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              NOTE:

                              For a pipeline job, you can configure a task group for each node or for the job. A task group configured for a node is prior to one configured for the job.

                              +
                              +

                              Parameters for KAFKA event-triggered jobs

                              Access Policy

                              Select the location where data is to be accessed:

                              -
                              • Access from the last location: For the first access, data is accessed from the most recently recorded location. For the subsequent access, data is accessed from the previously recoded location.
                              • Access from a new location: Data is accessed from the most recently recorded location each time.
                              +
                              • Access from the last location: For the first access, data is accessed from the most recently recorded location. For the subsequent access, data is accessed from the previously recoded location.
                              • Access from a new location: Data is accessed from the most recently recorded location each time.

                              Failure Policy

                              @@ -176,6 +222,34 @@
                              • Suspend
                              • Ignore the failure and proceed with the next event

                              Enable Dry Run

                              +

                              If you select this option, the job will not be executed, and a success message will be returned.

                              +

                              Task Groups

                              +

                              Select a configured task group. For details, see Configuring Task Groups.

                              +

                              Do not select is selected by default.

                              +

                              If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              NOTE:

                              For a pipeline job, you can configure a task group for each node or for the job. A task group configured for a node is prior to one configured for the job.

                              +
                              +

                              Enable Dry Run

                              +

                              If you select this option, the job will not be executed, and a success message will be returned.

                              +

                              Task Groups

                              +

                              Select a configured task group. For details, see Configuring Task Groups.

                              +

                              Do not select is selected by default.

                              +

                              If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                              +
                              NOTE:

                              For a pipeline job, you can configure a task group for each node or for the job. A task group configured for a node is prior to one configured for the job.

                              +
                              +
                              @@ -191,8 +265,8 @@

                              Scheduling Type

                              Scheduling type of the job. Available options include:

                              -
                              • Run once: You need to manually execute the job.
                              • Run periodically: The job runs automatically and periodically.
                              • Event-based: The job runs when certain external conditions are met.
                              +

                              Scheduling type of the job. Available options include:

                              +
                              • Run once: You need to manually run the job.
                              • Run periodically: The job runs automatically and periodically.
                              • Event-based: The job runs when certain external conditions are met.

                              Parameters displayed when Scheduling Type is Run periodically

                              @@ -201,23 +275,21 @@

                              From and to

                              The period during which a scheduling task takes effect.

                              -

                              You can set it to today or tomorrow by clicking the time box and then Today or Tomorrow.

                              Recurrence

                              The frequency at which the scheduling task is executed, which can be:

                              -
                              • Minutes
                              • Hours

                                You can select Interval Hour or Discrete Hour. If you select Discrete Hour, the job can only be scheduled by natural period.

                                -
                              • Every day
                              • Every week
                              • Every month

                                You can select the last day of each month.

                                -
                              +
                              • Minutes
                              • Hours
                              • Every day
                              • Every week
                              • Every month

                              For CDM and ETL jobs, the recurrence must be at least 5 minutes. In addition, the recurrence should be adjusted based on the data volume of the job table and the update frequency of the source table.

                              You can modify the scheduling period of a running job.

                              Cross-Cycle Dependency

                              Dependency between job instances

                              -
                              • Independent on the previous schedule cycle
                              • Self-dependent (The current job can continue to run only after the previous schedule cycle is successfully finished.)
                              • Skip waiting instances and run the latest instance
                              +

                              Dependency between job instances

                              +
                              • Independent on the previous schedule cycle

                                Set Concurrency. Number of job instances that are concurrently executed. If you set it to 1, a batch is executed only after the previous batch is executed (the execution is successful, cancelled, or failed).

                                +
                              • Self-dependent: The job can be rescheduled only after it is executed in the current schedule cycle. Before that, the job is in Waiting state.

                              Parameters displayed when Scheduling Type is Event-based

                              @@ -230,12 +302,12 @@

                              Connection Name

                              Before selecting a data connection, ensure that a Kafka data connection has been created in the Management Center.

                              +

                              Before selecting a data connection, ensure that a Kafka data connection has been created in the Management Center. This parameter is mandatory only when Event Type is set to KAFKA.

                              Topic

                              Topic of the message to be sent to the Kafka.

                              +

                              Topic of the message to be sent to the Kafka. This parameter is mandatory only when Event Type is set to KAFKA.

                              Consumer Group

                              @@ -257,6 +329,12 @@

                              Interval at which the system detects the stream for new messages. The unit of the interval can be Seconds or Minutes.

                              Access Policy

                              +
                              • Access from the last location
                              • Access from a new location

                                This parameter is mandatory only when Event Type is set to KAFKA.

                                +
                              +

                              Failure Policy

                              Select a policy to be performed after scheduling fails.

                              @@ -274,3 +352,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0471.html b/docs/dataartsstudio/umn/dataartsstudio_01_0471.html index 3805f9a08..e109e6511 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0471.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0471.html @@ -4,8 +4,8 @@

                              This section describes how to view the references of a script or all the scripts in a folder.

                              Prerequisites

                              A script has been developed based on Developing Scripts.

                              -

                              Procedure

                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                              3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                              4. To view the references of a script, right-click the script and select View Reference.

                                To view the references of all the scripts in a folder, right-click the folder and select View Reference.

                                -
                              5. In the displayed dialog box, you can view the references of a script or all the scripts in the folder.
                                Figure 1 References of a script
                                +

                                Procedure

                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                4. To view the references of a script, right-click the script and select View Reference.

                                  To view the references of all the scripts in a folder, right-click the folder and select View Reference.

                                  +
                                5. In the displayed dialog box, you can view the references of a script or all the scripts in the folder.
                                  Figure 1 References of a script
                              @@ -15,3 +15,10 @@
                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0489.html b/docs/dataartsstudio/umn/dataartsstudio_01_0489.html deleted file mode 100644 index ca3baed7f..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0489.html +++ /dev/null @@ -1,48 +0,0 @@ - - -

                              Http Trigger

                              -

                              Functions

                              Http Trigger is a cross-platform scheduling trigger node of DataArts Studio. If you want to trigger a job on DataArts Studio after a job on another scheduling system is complete, you can use the Http Trigger node.

                              -
                              -

                              Parameters

                              Table 1 describes the parameter of the Http Trigger node.

                              - -
                              - - - - - - - - - - - - - - - - - -
                              Table 1 Parameter of the Http Trigger node

                              Parameter

                              -

                              Mandatory

                              -

                              Description

                              -

                              Node ID

                              -

                              No

                              -

                              ID of the Http Trigger node. When you add an Http Trigger node, the system automatically generates a node ID, which is unique in the workspace and cannot be changed.

                              -

                              Node Name

                              -

                              Yes

                              -

                              Name of a node. The name must contain 1 to 128 characters, including only letters, numbers, underscores (_), hyphens (-), slashes (/), less-than signs (<), and greater-than signs (>).

                              -

                              Maximum Wait Time

                              -

                              Yes

                              -

                              Maximum wait time for HTTP messages. If no message is received within this time, the node and its subsequent nodes are canceled and the job is stopped.

                              -

                              The value ranges from 1 to 24 hours. The default value is 24 hours.

                              -
                              -
                              -
                              -
                              -
                              - -
                              - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0494.html b/docs/dataartsstudio/umn/dataartsstudio_01_0494.html index b47053726..b9238fc0e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0494.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0494.html @@ -2,11 +2,10 @@

                              Expression Overview

                              Node parameter values in a DataArts Factory job can be dynamically generated based on the running environment by using Expression Language (EL). You can determine whether to execute this node based on the input parameters of the pipeline and the output of the upstream node. EL uses simple arithmetic and logic to calculate and references embedded objects, including job objects and tool objects.

                              -

                              Job object: provides properties and methods of obtaining the output message, job scheduling plan time, and job execution time of the previous node in a job.

                              -

                              Tool job: Provides methods of operating character strings, time, and JSON. For example, truncating a substring from a string or formatting time.

                              +
                              • Job object: provides properties and methods of obtaining the output message, job scheduling plan time, and job execution time of the previous node in a job.
                              • Tool job: Provides methods of operating character strings, time, and JSON. For example, truncating a substring from a string or formatting time.

                              Syntax

                              Expression syntax:

                              #{expr}
                              -

                              In the preceding information, expr indicates an expression. # and {} are common operators used in EL, allowing you to access job properties using embedded objects.

                              +

                              In the preceding information, expr indicates an expression. # and {} are common operators used in EL, allowing you to access job properties using embedded objects.

                              Example

                              In the URL parameter of the Rest Client node, use expression tableName=#{JSONUtil.path(Job.getNodeOutput("get_cluster"),"tables[0].table_name")}.

                              Expression description:

                              @@ -14,20 +13,17 @@

                              Debugging Methods

                              You can debug EL expressions using the following methods.

                              This section uses the #{DateUtil.now()} expression as an example.

                              -
                              1. Use the DIS Client node.
                                • Prerequisites: A DIS stream is available.
                                • Method: Select the DIS Client node, write the EL expression in the data to be sent, and click Test. Then right-click the node to view the log. The value of the EL expression is printed in the log.

                                  -

                                  +
                                  1. Use the Kafka Client node.
                                    • Prerequisites: An MRS cluster with the Kafka component is available.
                                    • Method: Select the Kafka Client node, write the EL expression in the data to be sent, and click Test. Then right-click the node to view the log. The value of the EL expression is printed in the log.

                                      +

                                    -
                                  2. Use the Kafka Client node.
                                    • Prerequisites: An MRS cluster with the Kafka component is available.
                                    • Method: Select the Kafka Client node, write the EL expression in the data to be sent, and click Test. Then right-click the node to view the log. The value of the EL expression is printed in the log.

                                      -

                                      +
                                    • Use the shell node.
                                      • Prerequisites: An ECS is available.
                                      • Method: Create a host connection, print the EL expression using echo, and click Test. Then view the log. The value of the EL expression is printed in the log.

                                        +

                                      -
                                    • Use the shell node.
                                      • Prerequisites: An ECS is available.
                                      • Method: Create a host connection, print the EL expression using echo, and click Test. Then view the log. The value of the EL expression is printed in the log.

                                        -

                                        -
                                      -
                                    • Use the Create OBS node.

                                      If none of the preceding methods is available, use the Create OBS node and create an OBS path with the value of the EL expression as its name. You can click Test and go to the OBS console to view the name of the created path.

                                      -

                                      +
                                    • Use the Create OBS node.

                                      If the preceding methods are unavailable, use the Create OBS node and create an OBS path with the value of the EL expression as its name. You can click Test and go to the OBS console to view the name of the created path.

                                      +

                                      -

                                      +

                              @@ -38,3 +34,10 @@
                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0496.html b/docs/dataartsstudio/umn/dataartsstudio_01_0496.html index ad9fc83c7..cd78c5a61 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0496.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0496.html @@ -18,13 +18,20 @@

                              AD

                              y

                              +

                              y (within one year)

                              Year

                              2001

                              Y (across years)

                              +

                              Year

                              +

                              2001

                              +

                              M

                              Month in a year

                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0498.html b/docs/dataartsstudio/umn/dataartsstudio_01_0498.html index 2dbdf3162..1d3f7d360 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0498.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0498.html @@ -64,7 +64,7 @@

                              For example, to check whether a node is running successfully, you can use the following command, where test indicates the node name:

                              #{(Job.getNodeStatus("test")) == "success" }

                              Obtain the running status of the test node:

                              +

                              Obtains the running status of the test node:

                              #{Job.getNodeStatus("test")}

                              Obtains the output of a specified node. This method can only obtain the output of the previous dependent node.

                              • Obtain the output of the test node:

                                #{Job.getNodeOutput("test")}

                                +
                              • Obtains the output of the test node:

                                #{Job.getNodeOutput("test")}

                              • If the previous node has no execution result, the output is null.
                              • If the output of a node is a field, the output result is in the format like [["000"]]. In this case, you can use the EL expression to split the string result and obtain the field value output by the previous node. Note that the output result type is string. If you want to output the original data type, you need to use the EL expression of the For Each node and the loop embedded objects supported by the node.

                                #{StringUtil.split(StringUtil.split(StringUtil.split(Job.getNodeOutput("Name of the previous node"),"]")[0],"[")[0],"\\"")[0]}

                              • If the output of a node contains two or more fields, the output result is in the format like [["000"],["001"]]. In this case, you need to obtain the output result using the EL expression of the For Each node and the loop embedded objects supported by the node, for example, #{Loop.current[0]}.

                              Obtain the value of the test parameter:

                              +

                              Obtains the value of the test parameter:

                              #{Job.getParam("test")}

                              Obtains the plan time character string in a specified pattern. Pattern indicates the date and time mode. For details, see Date and Time Mode.

                              Obtain the planned job scheduling time, which is accurate to millisecond:

                              +

                              Obtains the planned job scheduling time, which is accurate to millisecond:

                              #{Job.getPlanTime("yyyy-MM-dd HH:mm:ss:SSS")}

                              Obtains the time character string of the day before the plan time. Pattern indicates the date and time mode. For details, see Date and Time Mode.

                              Obtain the time on the previous day of the planned job scheduling time, which is accurate to date:

                              +

                              Obtains the time on the previous day of the planned job scheduling time, which is accurate to date:

                              #{Job.getYesterday("yyyy-MM-dd HH:mm:ss:SSS")}

                              Obtains the time character string of last hour before the plan time. Pattern indicates the date and time mode. For details, see Date and Time Mode.

                              Obtain the time one hour before the planned job scheduling time, which is accurate to hour:

                              +

                              Obtains the time one hour before the planned job scheduling time, which is accurate to hour:

                              #{Job.getLastHour("yyyy-MM-dd HH:mm:ss:SSS")}

                              Obtains the data recorded during the running of a specified node. Currently, only the IDs of the jobs running using SQL statements on the DLI SQL node can be obtained. This method can only obtain the output of the previous dependent node.

                              For example, to obtain the job ID of the third statement on DLI node DLI_INSERT_DATA, run the following command: #{JSONUtil.path(Job.getRunningData("DLI_INSERT_DATA"),"jobIds[2]")}.

                              Obtain the ID of the job run by the third statement in the test of the DLI SQL node:

                              +

                              Obtains the ID of the job run by the third statement in the test of the DLI SQL node:

                              #{JSONUtil.path(Job.getRunningData("test"),"jobIds[2]")}

                              Returns the job ID in the first Insert SQL statement of the specified DLI SQL or Transform Load node. If the nodeName parameter is not specified, the job ID in the first DLI Insert SQL statement of the DLI SQL node is obtained. If the job ID cannot be obtained, the null value is returned.

                              Obtain the ID of job run by the first Insert SQL statement in the test of the DLI SQL node:

                              +

                              Obtains the ID of job run by the first Insert SQL statement in the test of the DLI SQL node:

                              #{Job.getInsertJobId("test")}

                              Returns the time string of the num working day before a planned time specified by pattern. The value of num must be a positive integer. If no result that meets the specified condition is found, null is returned.

                              This EL expression is suitable for selecting custom dates in a calendar to schedule jobs.

                              Obtains the date of the fifth working day before a specified day.

                              +

                              Obtain the date of the fifth working day before a specified job scheduling day.

                              #{Job.getPreviousWorkday(5, "yyyyMMdd")}

                              Returns the time string of the num non-working day before a planned time specified by pattern. The value of num must be a positive integer. If no result that meets the specified condition is found, null is returned.

                              This EL expression is suitable for selecting custom dates in a calendar to schedule jobs.

                              Obtains the date of the first non-working day before a specified day.

                              +

                              Obtains the date of the first non-working day before a specified job scheduling day.

                              #{Job.getPreviousNonWorkday(1, "yyyyMMdd")}

                              String getCalendarPreviousWorkday(String calendarName, Integer num, String pattern)

                              +

                              Returns the time string of the num working day before a planned time in the calendar specified by pattern. The value of num must be a positive integer. If no result that meets the specified condition is found, null is returned.

                              +

                              This EL expression is suitable for selecting custom dates in a calendar to schedule jobs.

                              +

                              Obtains the date of the working day five days before the specified planned job scheduling time in the calendar.

                              +

                              #{Job.getCalendarPreviousWorkday(5, "yyyyMMdd")}

                              +

                              String getCalendarPreviousNonWorkday(String calendarName, Integer num, String pattern)

                              +

                              Returns the time string of the num non-working day before a planned time in the calendar specified by pattern. The value of num must be a positive integer. If no result that meets the specified condition is found, null is returned.

                              +

                              This EL expression is suitable for selecting custom dates in a calendar to schedule jobs.

                              +

                              Obtains the date of the non-working day one day before the specified planned job scheduling time in the calendar.

                              +

                              #{Job.getCalendarPreviousNonWorkday(1, "yyyyMMdd")}

                              +

                              String getCalendarNextWorkday(String calendarName, Integer num, String pattern)

                              +

                              Returns the time string of the num working day after a planned time in the calendar specified by pattern. The value of num must be a positive integer. If no result that meets the specified condition is found, null is returned.

                              +

                              This EL expression is suitable for selecting custom dates in a calendar to schedule jobs.

                              +

                              Obtains the date of the working day five days after the specified planned job scheduling time in the calendar.

                              +

                              #{Job.getCalendarNextWorkday(5, "yyyyMMdd")}

                              +

                              String getCalendarNextNonWorkday(String calendarName, Integer num, String pattern)

                              +

                              Returns the time string of the num non-working day after a planned time in the calendar specified by pattern. The value of num must be a positive integer. If no result that meets the specified condition is found, null is returned.

                              +

                              This EL expression is suitable for selecting custom dates in a calendar to schedule jobs.

                              +

                              Obtains the date of the non-working day one day after the specified planned job scheduling time in the calendar.

                              +

                              #{Job.getPreviousNonWorkday(1, "yyyyMMdd")}

                              +
                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0500.html b/docs/dataartsstudio/umn/dataartsstudio_01_0500.html index 21de1a118..294b1d4cd 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0500.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0500.html @@ -38,10 +38,16 @@

                              Subtracts one day from the planned job scheduling time and convert the time to the yyyy-MM-dd format.

                              #{DateUtil.format(DateUtil.addDays(Job.planTime,-1),"yyyy-MM-dd")}

                              -

                              Subtracts one day from the planned job scheduling time and convert the time to the week format.

                              +

                              Subtracts one day from the planned job scheduling time and convert the time to the week format. (y: within one year)

                              • #{DateUtil.format(DateUtil.addDays(Job.planTime,-1),"yyyyw")}

                                If Job.planTime is January 7, 2024, value 20241 is returned.

                              -
                              • #{DateUtil.format(DateUtil.addDays(Job.planTime,-1),"yyyyww")}

                                If Job.planTime is January 7, 2024, value 202401 is returned.

                                +
                                • #{DateUtil.format(DateUtil.addDays(Job.planTime,-1),"yyyyww")}

                                  If Job.planTime is January 7, 2024, value 202401 is returned.

                                  +
                                +

                                Subtracts one day from the planned job scheduling time and convert the time to the week format. (Y: across years)

                                +
                                • #{DateUtil.format(DateUtil.addDays(Job.planTime,-7),"YYYYww")}

                                  If Job.planTime is January 7, 2024, value 202401 is returned.

                                  +
                                  NOTE:

                                  The differences between yyyy and YYYY are as follows:

                                  +
                                  • YYYY indicates the week year. It can correctly process the number of weeks across years.
                                  • yyyy indicates the calendar year, which may cause an inaccurate number of weeks across years.
                                  • Therefore, YYYY is used for processing cross-year services. Except that, yyyy should be used.
                                  • Currently, the calendar week is from Sunday to Saturday, rather than from Monday to Sunday.
                                  +
                              Table 1 Solution Parameters

                              Parameter

                              Description

                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0504.html b/docs/dataartsstudio/umn/dataartsstudio_01_0504.html index 757c3af62..323e504b7 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0504.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0504.html @@ -9,54 +9,54 @@

                              Importing Environment Variables

                              This function is available only if the OBS service is available. If OBS is unavailable, variables can be imported from the local PC.

                              -
                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                              3. In the navigation tree on the left, choose Specifications.
                              4. Click Environment Variables. On the Environment Variables page, click Import.
                              5. In the Import Environment Variable dialog box, select an environment variable file from OBS or a local path and the duplicate name policy.

                                Figure 1 Importing Environment Variables
                                +
                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                3. In the navigation tree on the left, choose Specifications.
                                4. Click Environment Variables. On the Environment Variables page, click Import.
                                5. In the Import Environment Variable dialog box, select an environment variable file from OBS or a local path and the duplicate name policy.

                                  Figure 1 Importing Environment Variables

                              -

                              Configuration Method

                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                              3. In the navigation tree on the left, choose Specifications.
                              4. On the Environment Variable page, set the variables or constants listed in Table 1 and click Save.

                                The difference between a variable and a constant lies in whether their values need to be reconfigured when they are imported to another workspace or project.

                                +

                                Exporting Environment Variables

                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                3. In the navigation tree on the left, choose Specifications.
                                4. Click Environment Variable. On the Environment Variable page, click Export to export environment variables.
                                +
                                +

                                Configuration Method

                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                3. In the navigation tree on the left, choose Specifications.
                                4. On the Environment Variable page, set the variables or constants listed in Table 1 and click Save.

                                  The difference between a variable and a constant lies in whether their values need to be reconfigured when they are imported to another workspace or project.

                                  • The value of a variable (such as workspace name) varies depending on the workspace. When exporting a variable from a workspace and import it to another workspace, you must reconfigure its value.
                                  • The value of a constant in different workspaces is the same. When importing a constant to another workspace, you do not need to reconfigure its value.
                                  -
                                  Figure 2 Configuring environment variables
                                  -

                                  -

                                  +
                                  Figure 2 Configuring environment variables
                                  -
                                  Table 1 Configuring environment variables

                                  Parameter

                                  +
                                  - - - - - - - - - - -
                                  Table 1 Configuring environment variables

                                  Parameter

                                  Mandatory

                                  +

                                  Mandatory

                                  Description

                                  +

                                  Description

                                  Parameter

                                  +

                                  Parameter

                                  Yes

                                  +

                                  Yes

                                  The parameter name must be unique, consist of 1 to 64 characters, and contain only letters, digits, underscores (_), and hyphens (-).

                                  +

                                  The parameter name must be unique, consist of 1 to 64 characters, and contain only letters, digits, underscores (_), and hyphens (-).

                                  The parameter name must be in the format set in Configuring Script Variables. For example, if the format set in the script variable definition is ${dlf.}, the parameter name must be set to dlf.xxx.

                                  Value

                                  +

                                  Value

                                  Yes

                                  +

                                  Yes

                                  Parameter values support constants and EL expressions but do not support system functions. For example, 123 and abc are supported. If the parameter value is a string, add double quotation marks (""), for example, "05".

                                  +

                                  Parameter values support constants and EL expressions but do not support system functions. For example, 123 and abc are supported. If the parameter value is a string, add double quotation marks (""), for example, "05".

                                  For details about how to use EL expressions, see Expression Overview.

                                  Description

                                  +

                                  Description

                                  No

                                  +

                                  No

                                  Parameter description

                                  +

                                  Parameter description

                                  -

                                  After configuring an environment variable, you can add, edit, or delete it.

                                  -
                                  • Add: Click Add to add an environment variable.
                                  • Edit: If the parameter value is a constant, change the parameter value in the text box. If the parameter value is an EL expression, click next to the text box to edit the EL expression. Click Save.
                                  • Delete: Click next to the parameter value text box to delete the environment variable.
                                  +

                                  You can add, modify, delete, and reset environment variables.

                                  +
                                  • Add an environment variable: Click Add. After an environment variable is added, Add is displayed for it.
                                  • Edit an environment variable: If the parameter value is a constant, change the parameter value in the text box. If the parameter value is an EL expression, click next to the text box to edit the EL expression. Click Save. After an environment variable is modified, Modify is displayed for it.
                                  • Delete an environment variable: Click Delete next to the parameter value text box. After an environment variable is deleted, Delete is displayed for it.
                                  • Reset an environment variable: When modifying or deleting an environment variable, you can click Reset in the Operation column to reset the variable value to the original value.

                                  How-Tos

                                  The configured environment variables can be used in either of the following ways:

                                  @@ -64,9 +64,8 @@

                                  Example

                                  Context:

                                  • A job named test has been created in the DataArts Factory module.
                                  • An environment variable has been added. The parameter name is job and the parameter value is 123.
                                  -
                                  1. Open test and drag a Create OBS node from the node library.
                                  2. On the Node Properties tab page, configure the node properties.

                                    Figure 3 Configuring parameters for the Create OBS node
                                    +
                                    1. Open test and drag a Create OBS node from the node library.
                                    2. On the Node Properties tab page, configure the node properties.

                                      Figure 3 Configuring parameters for the Create OBS node

                                    3. Click Save and then Monitor to monitor the running status of the job.
                                    -

                                  @@ -75,3 +74,10 @@
                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0505.html b/docs/dataartsstudio/umn/dataartsstudio_01_0505.html index adc7de5fa..2bc57ab91 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0505.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0505.html @@ -12,7 +12,7 @@ - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0506.html b/docs/dataartsstudio/umn/dataartsstudio_01_0506.html index 3ec832012..f84683253 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0506.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0506.html @@ -2,12 +2,13 @@

                                  Overview

                                  Choose Monitoring > Overview. On the Overview page, you can view the statistics of job instances in charts. Currently, you can view seven types of statistics:

                                  -
                                  • Status
                                    • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Today.
                                    • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Yesterday.
                                    • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Two days ago.
                                    • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Last 7 days.
                                    • You can click a status to go to the Monitor Instance page and view details about all jobs in the status.
                                      • The statistics include the monitoring data of the instances of real-time jobs. When you click a status, you will not be redirected to the Monitor Instance page of real-time jobs. Instead, you can only view the details of the instances of batch jobs.
                                      • By default, the system displays all job instances of the current day.
                                      +
                                      • Status
                                        • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Today.
                                        • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Yesterday.
                                        • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Two days ago.
                                        • You can filter out your or all job instances by selecting My Instances or All, and filter out job instances of the current day by selecting Last 7 days.
                                        • You can click a status to go to the Monitor Instance page and view details about all jobs in the status.
                                          • The statistics include the monitoring data of the instances of real-time jobs. When you click a status, you will not be redirected to the Monitor Instance page of real-time jobs. Instead, you can only view the details of the instances of batch jobs.
                                          • By default, the system displays all job instances of the current day.
                                          • You can view the total number of instances that meet the filter criteria, the total number of instances that were successfully executed, and the percentage of such instances.
                                            Figure 1 Status
                                            +
                                      • Completed Tasks

                                        Successfully executed instances of the current day are collected once an hour. A task is a job node.

                                        -
                                        • You can view the number of all types of job nodes successfully executed on the previous day, on the current day, and over the last seven days on average.
                                        • You can view the number of a specific type of job nodes successfully executed on the previous day, on the current day, and over the last seven days on average.
                                        +
                                        • You can specify a date and view the number of all job nodes successfully executed on the previous day, on the selected day, and over the last seven days on average.
                                        • You can specify a date and view the number of different types of job nodes successfully executed on the previous day, on the selected day, and over the last seven days on average.
                                      • Tasks

                                        Number of tasks (operators in jobs) started in five minutes. Data of 30 days is available.

                                        • You can filter the operators started on each day within 30 days.
                                        • You can view the curve of the number of all operators that have been started.
                                        • You can view the curve of the number of different types of operators that have been started.
                                        @@ -36,3 +37,10 @@
                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0508.html b/docs/dataartsstudio/umn/dataartsstudio_01_0508.html index af6cf3cf1..e5aad7b50 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0508.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0508.html @@ -3,100 +3,89 @@

                                      Monitoring a Batch Job

                                      In the batch processing mode, data is processed periodically in batches based on the job-level scheduling plan, which is used in scenarios with low real-time requirements. This type of job is a pipeline that consists of one or more nodes and is scheduled as a whole. It cannot run for an unlimited period of time, that is, it must end after running for a certain period of time.

                                      You can choose Monitor Job and click the Batch Job Monitoring tab to view the scheduling status, scheduling period, and start time of a batch job, and perform the operations listed in Table 1.

                                      -
                                      Figure 1 Monitoring a Batch Job
                                      -

                                      +
                                      Figure 1 Monitoring batch jobs
                                      +

                                      -
                                      Table 1 Operations supported by batch job monitoring

                                      No.

                                      +
                                      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + +
                                      Table 1 Operations supported by batch job monitoring

                                      Operation

                                      Operation

                                      -

                                      Description

                                      +

                                      Description

                                      1

                                      +

                                      Filtering jobs by Job Name, Owner, CDM Job, Scheduling Identity, or Node Type

                                      Filtering jobs by Job Name, Owner, CDM Job, or Node Type

                                      -

                                      N/A

                                      +

                                      N/A

                                      2

                                      +

                                      Filtering jobs by whether notifications have been configured, scheduling status, job tag, or next plan time

                                      Filtering jobs by whether notifications have been configured, scheduling status, job tag, or next plan time

                                      -

                                      You can filter jobs for which no notification has been configured by notification type (such as exception or failure) so that you can set alarm notifications in batches.

                                      +

                                      You can filter jobs for which no notification has been configured by notification type (such as exception or failure) so that you can set alarm notifications in batches.

                                      3

                                      +

                                      Performing operations on jobs in a batch

                                      Performing operations on jobs in a batch

                                      -

                                      Select multiple jobs and perform operations on them.

                                      +

                                      Select multiple jobs and perform operations on them.

                                      4

                                      +

                                      Viewing job instance status

                                      Viewing job instance status

                                      -

                                      Click in front of the job name. The Last Instance page is displayed. You can view information about the last instance of the job.

                                      +

                                      Click in front of the job name. The Last Instance information is displayed. You can view information about the last instance of the job.

                                      +

                                      In the Operation column of the last instance, you can view the run logs of the instance and rerun the instance.

                                      +
                                      NOTE:
                                      • The rerun job may run at the same time as a normally scheduled job. Check whether the job supports concurrent running. If the number or names of nodes in the job change, the rerunning starts from the first node. If you rerun a job instance in successful state, the rerunning starts from the first node.
                                      • When rerunning a job instance, you need to set Parameters to Use and Ignore OBS Listening.

                                        You can set Parameters to Use to Parameters of the original job or Parameters of the latest job.

                                        +

                                        Ignore OBS Listening is set to Yes by default.

                                        +
                                      • In enterprise mode, developers cannot rerun job instances.
                                      +

                                      5

                                      +

                                      Viewing node information of the job

                                      Viewing node information of the job

                                      -

                                      Click a job name. On the displayed page, click the job node and view its associated jobs/scripts and monitoring information.

                                      +

                                      Click a job name. On the displayed page, click the job node and view its associated jobs/scripts and monitoring information.

                                      Click a job name. On the displayed page, view the job instance. For details, see Batch Job Monitoring: Job Instances.

                                      6

                                      +

                                      Job scheduling operations

                                      Job scheduling operations

                                      -

                                      You can run, pause, recover, stop, and configure scheduling. For details, see Batch Job Monitoring: Scheduling a Job.

                                      +

                                      You can run, pause, recover, stop, and configure scheduling. For details, see Batch Job Monitoring: Scheduling a Job.

                                      7

                                      +

                                      Configuring notifications

                                      Configuring notifications

                                      -

                                      In the Operation column of a job, choose More > Set Notification. In the displayed dialog box, configure notification parameters. Table 1 describes the notification parameters.

                                      +

                                      In the Operation column of a job, choose More > Configuration Notification. In the displayed dialog box, configure notification parameters. Table 1 describes the notification parameters.

                                      +

                                      You can also click Configure Notification to configure notifications for jobs based on Table 1.

                                      +

                                      For how to modify existing notification configuration, see Notification Management. If you switch to the Manage Notification page from a job, only the configurations of the job are displayed.

                                      8

                                      +

                                      Monitoring instances

                                      Monitoring instances

                                      -

                                      In the Operation column of a job, choose More > Monitor Instance to view the running records of all instances of the job.

                                      +

                                      In the Operation column of a job, choose More > Monitor Instance to view the running records of all instances of the job.

                                      9

                                      +

                                      Configuring scheduling information

                                      PatchData

                                      -

                                      In the Operation column of a job, choose More > PatchData. For details, see Batch Job Monitoring: PatchData.

                                      +

                                      In the Operation column of a job, click More and select Scheduling Setup. On the displayed job development page, you can view and configure the job scheduling information.

                                      +
                                      NOTE:

                                      You cannot configure scheduling information for a running job.

                                      +

                                      10

                                      +

                                      PatchData

                                      Adding a job tag

                                      -

                                      In the Operation column of a job, choose More > Add Job Tag. For details, see Batch Job Monitoring: Adding a Job Tag.

                                      +

                                      In the Operation column of a job, choose More > PatchData. For details, see Batch Job Monitoring: PatchData.

                                      +

                                      This function is available only for jobs that are scheduled periodically.

                                      11

                                      +

                                      Adding a job tag

                                      Viewing a job dependency graph

                                      -

                                      In the Operation column of a job, choose More > View Job Dependency Graph. For details, see Batch Processing: Viewing a Job Dependency Graph.

                                      +

                                      In the Operation column of a job, choose More > Add Job Tag. For details, see Batch Job Monitoring: Adding a Job Tag.

                                      12

                                      +

                                      Viewing a job dependency graph

                                      Exporting all data

                                      +

                                      In the Operation column of a job, click More and select View Job Dependency Graph. For details, see Batch Job Monitoring: Viewing a Job Dependency Graph.

                                      Click Export All Data. In the displayed Export All Data dialog box, click OK. After the export is complete, go to the Download Center page to view the exported data.

                                      +

                                      Exporting all data

                                      +

                                      Click Export All Data. In the displayed Export All Data dialog box, click OK. After the export is complete, go to the Download Center page to view the exported data.

                                      If the default storage path is not configured, you can set a storage path and select Set as default OBS path in the Export to OBS dialog box.

                                      A maximum of 30 MB data can be exported. If there are more than 30 MB data, the data will be automatically truncated.

                                      The exported job instances map job nodes. You cannot export data by selecting job names. Instead, you can select the data to be exported by setting filter criteria.

                                      @@ -108,7 +97,7 @@

                                      Click a job name. On the displayed page, view the job parameters, properties, and instances.

                                      Click a node of a job to view the node properties, script content, and node monitoring information.

                                      In addition, you can view the current job version and job scheduling status, schedule, stop, or pause a job, configure patch data, notification, or update frequency for a job.

                                      -

                                      Batch Job Monitoring: Job Instances

                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                      3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                      4. Click the Batch Job Monitoring tab.
                                      5. Click a job name. On the displayed page, click the Job Instances tab to view job instances. You can perform the following operations:
                                        • Select Show Instances to Be Generated and set the time range to filter job instances that are expected to be generated in the future.

                                          A maximum of 100 instances expected to be generated can be displayed.

                                          +

                                          Batch Job Monitoring: Job Instances

                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                          3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                          4. Click the Batch Job Monitoring tab.
                                          5. Click a job name. On the displayed page, click the Job Instances tab to view job instances. You can perform the following operations:
                                            • Select Show Instances to Be Generated and set the time range to filter job instances that are expected to be generated in the future.

                                              A maximum of 100 instances expected to be generated can be displayed.

                                            • Freeze or unfreeze job instances that are expected to be generated in the future. You can click Freeze or Unfreeze above the job instance list, or click More in the Operation column and select Freeze or Unfreeze.

                                              Freeze: You can only freeze job instances that have not been generated or are in waiting state.

                                              You cannot freeze jobs instances that have been frozen.

                                              @@ -120,22 +109,22 @@

                                          Batch Job Monitoring: Scheduling a Job

                                          After developing a job, you can manage job scheduling tasks on the Monitor Job page. Specific operations include to run, pause, restore, or stop scheduling.

                                          -
                                          Figure 2 Scheduling a job
                                          -
                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                          3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                          4. Click the Batch Job Monitoring tab.

                                            You can filter batch processing jobs by scheduling type or scheduling frequency.

                                            +
                                            Figure 2 Scheduling a job
                                            +
                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                            3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                            4. Click the Batch Job Monitoring tab.

                                              You can filter batch processing jobs by scheduling type or scheduling frequency.

                                            5. In the Operation column of the job, click Execute, Pause, Restore, or Stop Scheduling.

                                            If a dependent job has been configured for a batch job, you can select either Start Current Job Only or Start Current and Depended Jobs when submitting the batch job. For details about how to configure dependent jobs, see Setting Up Scheduling for a Job Using the Batch Processing Mode.

                                            If the job is on the baseline task link, the system automatically displays a dialog box indicating that the baseline is associated when the scheduling is paused or stopped.

                                            If the job is on the baseline task link or is depended on by other jobs, the system automatically displays a dialog box when the scheduling is paused or stopped.

                                            -
                                            Figure 3 Starting a job
                                            +
                                            Figure 3 Starting a job

                                            Batch Job Monitoring: PatchData

                                            A job executes a scheduling task to generate a series of instances in a certain period of time. This series of instances are called PatchData. PatchData can be used to fix the job instances that have data errors in the historical records or to build job records for debugging programs.

                                            Only the periodically scheduled jobs support PatchData. For details about the execution records of PatchData, see Monitoring PatchData.

                                            Do not modify the job configuration when PatchData is being performed. Otherwise, job instances generated during PatchData will be affected.

                                            -
                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                            3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                            4. Click the Batch Job Monitoring tab.
                                            5. In the Operation column of the job, choose More > Configure PatchData.
                                            6. Configure PatchData parameters based on Table 2.
                                              Figure 4 PatchData parameters
                                              +
                                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                              3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                              4. Click the Batch Job Monitoring tab.
                                              5. In the Operation column of the job, choose More > Configure PatchData.
                                              6. Configure PatchData parameters based on Table 2.
                                                Figure 4 PatchData parameters

                                                + + + +
                                                Table 2 Parameters

                                                Parameter

                                                @@ -174,12 +163,14 @@

                                                You also need to set the following PatchData parameters:

                                                You can click Add Date Range to add multiple discrete date ranges for PatchData. You must set at least one date range.

                                                You can click Delete to delete discrete date ranges.

                                                +
                                                NOTE:

                                                DataArts Studio does not support concurrent running of PatchData instances and periodic job instances of underlying services (such as CDM and DLI). To prevent PatchData instances from affecting periodic job instances and avoid exceptions, ensure that they do not run at the same time.

                                                +

                                                Run PatchData Tasks Periodically

                                                • Yes: PatchData jobs will be executed based on the configured period.

                                                  The first value indicates a specific value.

                                                  -

                                                  The second value indicates that data is patched based on a specified period, for example, minutes, hours, days, weeks, or months.

                                                  +

                                                  The second value indicates that data is patched based on a specified period, for example, hours, days, weeks, or months.

                                                  NOTE:

                                                  If you set a period, PatchData tasks will be scheduled based on that period. If the job is scheduled every few minutes, hours, or days, PatchData tasks will be scheduled based on the period you set. For example, if you want to patch data from 00:00 on Jan 1, 2023 to 00:00 on Feb 1, 2023 for an hourly job that starts at 01:00 every day, and set the PatchData period to two days, PatchData tasks will be scheduled at 00:00 on Jan 1, 2023, 00:00 on Jan 3, 2023, 00:00 on Jan 5, 2023, and so on. If the PatchData task scheduling period is in months and the first scheduling date falls on the last day of a month, PatchData tasks will be scheduled on the last day of each month.

                                                • No: PatchData jobs will not be executed periodically. Instead, the system executes PatchData jobs based on the existing rule.
                                                @@ -206,7 +197,9 @@

                                                Upstream or Downstream Job

                                                Select the upstream and downstream jobs (jobs that depend on the current job) that require PatchData.

                                                -

                                                The job dependency graph is displayed. For details about the operations on the job dependency graph, see Batch Processing: Viewing a Job Dependency Graph.

                                                +

                                                The job dependency graph is displayed. For details about the operations on the job dependency graph, see Batch Job Monitoring: Viewing a Job Dependency Graph.

                                                +
                                                NOTE:

                                                If you set Run PatchData Tasks Periodically to Yes, you can only select an upstream or downstream job with the same scheduling period as the job.

                                                +

                                                Patch Data by Day

                                                @@ -251,17 +244,17 @@
                                              7. Click OK. The system starts to perform PatchData and the PatchData Monitoring page is displayed.
                                              8. Batch Job Monitoring: Adding a Job Tag

                                                Tags can be added to jobs to facilitate job instance filtering.

                                                -
                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                4. Click the Batch Job Monitoring tab.
                                                5. In the Operation column of a job, choose More > Add Job Tag.
                                                6. In the Add Job Tag dialog box displayed, set the job tag parameters.
                                                  Figure 5 Parameters for adding a job tag
                                                  +
                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                  3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                  4. Click the Batch Job Monitoring tab.
                                                  5. In the Operation column of a job, choose More > Add Job Tag.
                                                  6. In the Add Job Tag dialog box displayed, set the job tag parameters.
                                                    Figure 5 Parameters for adding a job tag
                                                  7. Click OK.
                                                -

                                                Batch Processing: Viewing a Job Dependency Graph

                                                In the job dependency graph, you can view the dependencies between jobs.

                                                -
                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                4. Click the Batch Job Monitoring tab.
                                                5. In the Operation column of a job, choose More > View Job Dependency Graph.
                                                6. On the displayed Job Dependency page, perform any of the following operations:
                                                  • In the upper right corner, select Display complete dependency graphs, Display the current job and its upstream and downstream jobs, or Display the current job and its directly connected jobs.
                                                  • In the search box in the upper right corner, you can enter the name of a node to search for the node. The node found will be highlighted.
                                                  • Click Download to download the job dependency file.
                                                  • Scroll your mouse wheel to zoom in or zoom out the dependency graph.
                                                  • Drag the blank area to view the complete relationship graph.
                                                  • When the cursor is hovered on a job node, the node is marked green, its upstream job is marked blue, and its downstream job is marked orange.
                                                    Figure 6 Marking upstream and downstream job nodes of a node
                                                    -
                                                  • Right-click a job node to view the job, copy the job name, and collapse upstream or downstream jobs.
                                                    Figure 7 Job node operations
                                                    +

                                                    Batch Job Monitoring: Viewing a Job Dependency Graph

                                                    In the job dependency graph, you can view the dependencies between jobs.

                                                    +
                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                    3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                    4. Click the Batch Job Monitoring tab.
                                                    5. In the Operation column of a job, choose More > View Job Dependency Graph.
                                                    6. On the displayed Job Dependency page, perform any of the following operations:
                                                      • In the upper right corner, select Display complete dependency graphs, Display the current job and its upstream and downstream jobs, or Display the current job and its directly connected jobs.
                                                      • In the search box in the upper right corner, you can enter the name of a node to search for the node. The node found will be highlighted.
                                                      • Click Download to download the job dependency file.
                                                      • Scroll your mouse wheel to zoom in or zoom out the dependency graph.
                                                      • Drag the blank area to view the complete relationship graph.
                                                      • When the cursor is hovered on a job node, the node is marked green, its upstream job is marked blue, and its downstream job is marked orange.
                                                        Figure 6 Marking upstream and downstream job nodes of a node
                                                        +
                                                      • Right-click a job node to view the job, copy the job name, and collapse upstream or downstream jobs.
                                                        Figure 7 Job node operations

                                                    You can also view the node monitoring information of a job on the job details page.

                                                    -
                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                    3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                    4. Click the Batch Job Monitoring tab.
                                                    5. Click a job name and then a node to view monitoring information of the node.

                                                      Click Edit to access the job development page.

                                                      +
                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                      3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                      4. Click the Batch Job Monitoring tab.
                                                      5. Click a job name and then a node to view monitoring information of the node.

                                                        Click Edit to access the job development page.

                                                @@ -271,3 +264,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0509.html b/docs/dataartsstudio/umn/dataartsstudio_01_0509.html index aaa14039e..8a6297408 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0509.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0509.html @@ -3,7 +3,7 @@

                                                Monitoring a Real-Time Job

                                                In the real-time processing mode, data is processed in real time, which is used in scenarios with high real-time performance. This type of job is a pipeline that consists of one or more nodes. You can configure scheduling policies for each node, and the tasks started by nodes can keep running for an unlimited period of time. In this type of job, lines with arrows represent only service relationships, rather than task execution processes or data flows.

                                                You can choose Monitor Job and click the Real-Time Job Monitoring tab to view the job status, start time, and end time, and perform the operations listed in Table 1.

                                                -
                                                Figure 1 Real-time job monitoring page
                                                +
                                                Figure 1 Real-time job monitoring page

                                                -
                                                Table 1 Operations supported by real-time job monitoring

                                                No.

                                                @@ -39,7 +39,7 @@

                                                Viewing job instance status

                                                Click job in front of the name. The Last Instance page is displayed. You can view information about the last instance of the job.

                                                +

                                                Click job in front of the name. The Last Instance page is displayed. You can view information about the last instance of the job.

                                                5

                                                @@ -106,10 +106,10 @@

                                                Click a job name. On the displayed page, view the job parameters, properties, and instances.

                                                -

                                                Click a node of a job to view the node properties, script content, and node monitoring information.

                                                +

                                                Click a node of a job to view the node properties, script content, and node monitoring information. On the Nodes tab page, you can view the run logs of the real-time job.

                                                In addition, you can view the current job version and status, start, rerun, and develop jobs, determine whether to display metric monitoring, and set the job refresh frequency.

                                                Real-Time Job Monitoring: Disabling and Restoring a Node

                                                You can disable a node in a real-time job and restore it in another location.

                                                -
                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                3. In the left navigation pane of DataArts Factory, choose Monitoring > Monitor Job.
                                                4. On the Real-Time Job Monitoring tab page, click a job name.
                                                5. On the displayed page, right-click the node and select Disable.
                                                6. Right-click the node and choose Resume from the shortcut menu. The Resume Node Running dialog box is displayed, as shown in Table 2. +
                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                  3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                  4. On the Real-Time Job Monitoring tab page, click a job name.
                                                  5. On the displayed page, right-click the node and select Disable.
                                                  6. Right-click the node and choose Resume from the shortcut menu. The Resume Node Running dialog box is displayed, as shown in Table 2.
                                                    @@ -151,7 +151,7 @@

                                                    Real-Time Job Monitoring: Configuring Scheduling for a Node Where Event-driven Scheduling Is Configured

                                                    If event-driven scheduling is configured for a node in a real-time job, right-click the node on the job monitoring details page and choose Configure Scheduling from the shortcut menu to view and modify the scheduling information about the node.

                                                    -
                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                    3. In the left navigation pane of DataArts Factory, choose Monitoring > Monitor Job.
                                                    4. On the Real-Time Job Monitoring tab page, click a job name.
                                                    5. On the displayed page, right-click the node where event-driven scheduling is configured, select Configure Scheduling, and configure the parameters shown in Table 3.
                                                      Figure 2 Configuring scheduling
                                                      +
                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                      3. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                      4. On the Real-Time Job Monitoring tab page, click a job name.
                                                      5. On the displayed page, right-click the node where event-driven scheduling is configured, select Configure Scheduling, and configure the parameters shown in Table 3.
                                                        Figure 2 Configuring scheduling
                                                    Table 2 Resumption parameters

                                                    Parameter

                                                    Description

                                                    @@ -129,7 +129,7 @@

                                                    Run From

                                                    Parameters for performing the tasks generated during the pause period.

                                                    -

                                                    Position from which running restarts.

                                                    +

                                                    Position from which running restarts.

                                                    • Paused node
                                                    • The first node of the subjob
                                                    @@ -187,3 +187,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0511.html b/docs/dataartsstudio/umn/dataartsstudio_01_0511.html index dea5fa3d3..e49e4ec17 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0511.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0511.html @@ -2,8 +2,8 @@

                                                    Instance Monitoring

                                                    Each time a job is executed, a job instance record is generated. In the navigation pane of the DataArts Factory console, choose Monitoring. On the Monitor Instance page, you can view the job instance information and perform more operations on instances as required.

                                                    -

                                                    You can search for instances by Job Name, Created By, Owner, CDM Job, Node Type, and Job Tag. Search by CDM job is to search for job instances by node.

                                                    -

                                                    Performing Job Instance Operations

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                    3. In the navigation pane on the left of the DataArts Factory page, choose Monitoring > Monitor Instance
                                                    4. You can stop, rerun, or continue to execute instances or make instances succeed. For details, see Table 1.

                                                      When multiple instances are rerun in batches, the sequence is as follows:

                                                      +

                                                      You can search for instances by Job Name, Created By, Owner, CDM Job, Node Type, and Job Tag. Search by CDM job is to search for job instances by node. In addition, you can filter job instances by status or scheduling mode.

                                                      +

                                                      Performing Job Instance Operations

                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                      3. In the navigation pane on the left of the DataArts Factory page, choose Monitoring > Monitor Instance
                                                      4. You can stop, rerun, or continue to execute instances or make instances succeed. For details, see Table 1.

                                                        When multiple instances are rerun in batches, the sequence is as follows:

                                                        • If a job does not depend on the previous schedule cycle, multiple instances run concurrently.
                                                        • If jobs are dependent on their own, multiple instances are executed in serial mode. The instance that first finishes running in the previous schedule cycle is the first one to rerun.
                                                      5. Table 1 describes the operations that can be performed on the instance.
                                                    Table 3 Policy parameters

                                                    Parameter

                                                    - @@ -32,7 +32,7 @@ @@ -57,6 +57,11 @@ + + + + + + + + + + + + - @@ -111,7 +132,7 @@
                                                    Table 1 Instance monitoring operations

                                                    Operation

                                                    @@ -18,7 +18,7 @@

                                                    If you do not select Exact search, fuzzy search by job name is supported.

                                                    Filtering jobs by CDM Job or Node Type

                                                    +

                                                    Filtering jobs by CDM Job, Job Tag, or Node Type

                                                    N/A

                                                    Rerun a subjob instance that is in the Succeed or Canceled state.

                                                    For details, see Rerunning Job Instances.

                                                    -
                                                    NOTE:

                                                    Manually scheduled jobs cannot be rerun.

                                                    +
                                                    NOTE:
                                                    • Manually scheduled jobs cannot be rerun.
                                                    • In enterprise mode, developers cannot rerun job instances.

                                                    If instances need manual confirmation before they are executed, they are in waiting confirmation state when they are being rerun. When you click Execute, the instances are in waiting execution state.

                                                    Confirm executing instances in pending confirmation state.

                                                    Execute Job Without Dependency

                                                    +

                                                    Select job instances that have dependency relationships and execute them.

                                                    +

                                                    More > Manual Retry

                                                    Retry abnormal instances.

                                                    @@ -84,6 +89,11 @@

                                                    Forcibly change the status of an instance from Abnormal, Canceled, or Failed to Succeed.

                                                    More > Execute Job Without Dependency

                                                    +

                                                    Execute job instances that have dependency relationships.

                                                    +

                                                    More > View

                                                    Go to the job development page and view job information.

                                                    @@ -94,9 +104,20 @@

                                                    You can view the historical performance of a job instance.

                                                    More > View Rerun History

                                                    +

                                                    You can view the job instance rerun records.

                                                    +

                                                    This is possible only if the job instance has rerun at least once.

                                                    +

                                                    More > Execute Preferentially

                                                    +

                                                    Preferentially execute job instances.

                                                    +

                                                    DAG

                                                    Display the DAG so that you can view the dependency between instances and perform O&M operations on the DAG.

                                                    +

                                                    Display the DAG so that you can view the dependency between job instances and perform O&M operations on the DAG.

                                                    For details, see Viewing the DAG.

                                                    -
                                                  7. Click in front of an instance. The running records of all nodes in the instance are displayed.
                                                  8. Table 2 describes the operations that can be performed on the node. +
                                                  9. Click in front of an instance. The running records of all nodes in the instance are displayed.
                                                  10. Table 2 describes the operations that can be performed on the node.
                                                    -
                                                    Table 2 Operations (node)

                                                    Operation

                                                    Description

                                                    @@ -121,6 +142,7 @@

                                                    View Log

                                                    View the log information of a node.

                                                    +

                                                    You can control access to the test run logs. For example, after user A performs a test, user A can view the test run logs on the Monitor Instance page, but user B cannot.

                                                    Manual Retry

                                                    @@ -165,55 +187,76 @@ -

                                                    Rerunning Job Instances

                                                    You can rerun a job instance that is successfully executed or fails to be executed by setting its rerun position.

                                                    -
                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                    3. In the navigation pane on the left of the DataArts Factory page, choose Monitoring > Monitor Instance
                                                    4. In the Operation column of a job, click Rerun to rerun the job instance. Alternatively, click the check box on the left of a job, and then click the Rerun button to rerun the job instance.
                                                      Figure 1 Setting the job rerunning
                                                      -

                                                      +

                                                      Rerunning Job Instances

                                                      In enterprise mode, developers cannot rerun job instances.

                                                      +
                                                      +

                                                      You can rerun a job instance that is successfully executed or fails to be executed by setting its rerun position.

                                                      +
                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                      3. In the navigation pane on the left of the DataArts Factory page, choose Monitoring > Monitor Instance
                                                      4. Locate a job and click Rerun in the Operation column to rerun a job instance. Alternatively, select the check boxes to the left of job names and click Rerun above the job list to rerun multiple job instances.
                                                        Figure 1 Rerunning a job instance
                                                        +
                                                        Figure 2 Rerunning job instances
                                                        +

                                                        When rerunning multiple job instances, you only need to set Rerun From, Parameters to Use, and Ignore OBS Listening.

                                                        +
                                                        -
                                                        - @@ -91,10 +93,10 @@ - - @@ -107,19 +109,19 @@ - - - - @@ -193,3 +195,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0576.html b/docs/dataartsstudio/umn/dataartsstudio_01_0576.html index dadcf4053..d84ac888e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0576.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0576.html @@ -4,17 +4,17 @@

                                                        CDM provides independent clusters for secure and reliable data migration. Clusters are isolated from each other and cannot access each other.

                                                        CDM clusters can be used in the following scenarios:
                                                        • They can be used to create and run data migration jobs.
                                                        • They can function as agents for connecting Management Center to a data lake.
                                                        -

                                                        Prerequisites

                                                        You have applied for a VPC, subnet, and security group. If the CDM cluster tries to connect to another cloud service, ensure that the cluster and the cloud service are in the same VPC. Otherwise, an EIP is required.
                                                        • If the CDM cluster and a cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other through an intranet.
                                                        • If the CDM cluster and the cloud service are in the same region and VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                        • If the CDM cluster and a cloud service are in different VPCs of the same region, you can create a VPC peering connection to enable them to communicate with each other. For details about how to create a VPC peering connection, see "VPC Peering" in Virtual Private Cloud (VPC) Usage Guide.

                                                          Note: If a VPC peering connection is created, the peer VPC subnet may overlap with the CDM management network. As a result, data sources in the peer VPC cannot be accessed. You are advised to use the Internet for cross-VPC data migration, or contact the administrator to add specific routes for the VPC peering connection in the CDM background.

                                                          +

                                                          Prerequisites

                                                          You have applied for a VPC, subnet, and security group. If the CDM cluster tries to connect to another cloud service, ensure that the cluster and the cloud service are in the same VPC. Otherwise, an EIP is required.
                                                          • If the CDM cluster and a cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other through an intranet.
                                                          • If the CDM cluster and the cloud service are in the same region and VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                          • If the CDM cluster and a cloud service are in different VPCs of the same region, you can create a VPC peering connection to enable them to communicate with each other. For details about how to configure a VPC peering connection, see "VPC Peering Connection" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide

                                                            Note: If a VPC peering connection is created, the peer VPC subnet may overlap with the CDM management network. As a result, data sources in the peer VPC cannot be accessed. You are advised to use the Internet for cross-VPC data migration, or contact the administrator to add specific routes for the VPC peering connection in the CDM background.

                                                          • If the CDM cluster and a cloud service are located in different regions, you need to use the Internet or Direct Connect to enable them to communicate with each other. When using the Internet, ensure that an EIP has been bound to the CDM cluster, the security group of CDM allows outbound traffic from the host where the off-cloud data source is located, the host where the data source is located can access the Internet, and the connection port has been enabled in the firewall rules.
                                                          • In addition, an enterprise project may also affect the communication between the CDM cluster and other cloud services. The CDM cluster can communicate with a cloud service only if they have the same enterprise project.
                                                          -

                                                          Procedure

                                                          If you want to use DataArts Migration but the DataArts Studio instance has no CDM cluster, create one by following the instructions in "Preparations" > "Creating DataArts Studio Instances" > "(Optional) Creating a DataArts Studio Incremental Package" in the DataArts Studio User Guide.

                                                          +

                                                          Scenario

                                                          The DataArts Studio instance does not contain CDM clusters. To use CDM, create a CDM cluster by following the instructions in Creating a DataArts Migration Incremental Package.

                                                          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0578.html b/docs/dataartsstudio/umn/dataartsstudio_01_0578.html index 03424c011..283789a3e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0578.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0578.html @@ -1,18 +1,27 @@ -

                                                          Restarting a Cluster

                                                          +

                                                          Restarting a CDM Cluster

                                                          Scenario

                                                          After modifying some configurations (for example, disabling user isolation), you must restart the cluster to make the modification take effect.

                                                          +

                                                          If you restart a CDM cluster process or VM, jobs that are running will fail, and no jobs can be scheduled during the restart. Exercise caution when performing this operation.

                                                          +

                                                          Prerequisites

                                                          You have created a CDM cluster.

                                                          -

                                                          Restarting a cluster

                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                          1. Locate the row that contains the target cluster, click More in the Operation column, and select Restart from the drop-down list.

                                                            Figure 1 Restarting a cluster
                                                            +

                                                            Restarting a cluster

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                            1. Locate the row that contains the target cluster, click More in the Operation column, and select Restart from the drop-down list.

                                                              Figure 1 Restarting a cluster

                                                            2. Select Restart CDM service process or VM restart and click OK.

                                                              • Restart CDM service process: Only the CDM service process is restarted. The cluster VM will not be restarted.
                                                              • VM restart: The service process will be interrupted and VMs in the cluster will be restarted.

                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0579.html b/docs/dataartsstudio/umn/dataartsstudio_01_0579.html index 188a73d03..799dc1306 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0579.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0579.html @@ -1,22 +1,29 @@ -

                                                          Deleting a Cluster

                                                          +

                                                          Deleting a CDM Cluster

                                                          Scenario

                                                          You can delete a CDM cluster that you no longer use.

                                                          After a CDM cluster is deleted, the cluster and its data are destroyed and cannot be restored. Exercise caution when performing this operation.

                                                          Before deleting a cluster, note the following:

                                                          -
                                                          • Ensure that the cluster is not in use.
                                                          • Ensure that the links and jobs in the cluster have been backed up through the job export function described in Managing Jobs in Batches.
                                                          +
                                                          • Ensure that the cluster is not in use.
                                                          • Ensure that the links and jobs in the cluster have been backed up through the job export function described in Managing CDM Jobs.

                                                          Prerequisites

                                                          You have created a CDM cluster.

                                                          -

                                                          Deleting a Cluster

                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                          1. Delete a cluster using either of the following methods:

                                                            • Locate a cluster, click More in the Operation column, and select Delete.
                                                            • Select a cluster and click Delete above the cluster list.
                                                            -

                                                          2. Enter DELETE and click Yes.

                                                            Figure 1 Deleting a cluster
                                                            +

                                                            Deleting a Cluster

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                            1. Delete a cluster using either of the following methods:

                                                              • Locate a cluster, click More in the Operation column, and select Delete.
                                                              • Select a cluster and click Delete above the cluster list.
                                                              +

                                                            2. Enter DELETE and click Yes.

                                                              Figure 1 Deleting a cluster

                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0581.html b/docs/dataartsstudio/umn/dataartsstudio_01_0581.html index 8b6e62b05..21ed17f39 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0581.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0581.html @@ -8,14 +8,14 @@
                                                          • Scenario: The ID of the first cluster in the cluster list needs to be obtained and transferred to other nodes as a parameter.
                                                          • Key configurations: Set The response message body parses the transfer parameter of the first Rest Client to clusterId=clusters[0].clusterId. Other Rest Client nodes can reference the ID of the first cluster in ${clusterId} mode.

                                                            When setting The response message body parses the transfer parameter, ensure that the transferred parameter name (for example, clusterId) is unique among all node parameters of the job.

                                                          -
                                                          Figure 1 Rest Client job example 1
                                                          +
                                                          Figure 1 Rest Client job example 1

                                                          -
                                                          Figure 2 JSON message body
                                                          +
                                                          Figure 2 JSON message body

                                                          Obtaining the Return Value Using an EL Expression

                                                          The Rest Client node can be used together with EL expressions. You can select different EL expressions based on scenarios. This section describes how to develop your own jobs based on your service requirements.

                                                          As shown in Figure 3, the Rest Client invokes the API of MRS to query the cluster list and then invokes the Kafka Client to send a message.

                                                          • Scenario: The Kafka Client sends a character string message. The message content is the ID of the first cluster in the cluster list.
                                                          • Key configurations: When you configure the Kafka Client, use the following EL expression to obtain a specific field in the message body returned by the REST API: #{JSONUtil.toString(JSONUtil.path(Job.getNodeOutput("Rest_Client_4901"),"clusters[0].clusterId"))}
                                                          -
                                                          Figure 3 Rest Client job example 2
                                                          +
                                                          Figure 3 Rest Client job example 2
                                                          @@ -24,3 +24,10 @@
                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0582.html b/docs/dataartsstudio/umn/dataartsstudio_01_0582.html index 6d4f9fe88..799741660 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0582.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0582.html @@ -5,7 +5,7 @@

                                                        You can use a For Each node to execute a subjob in a loop and use a dataset to replace the parameters in the subjob. The key parameters are as follows:

                                                        • Subjob in a Loop: Select the subjob to be executed in a loop.
                                                        • Dataset: Enter a set of parameter values of the subjobs. The value can be a specified dataset such as [['1'],['3'],['2']] or an EL expression such as #{Job.getNodeOutput('preNodeName')}, which is the output value of the previous node.
                                                        • Subjob Parameter Name: The parameter name is the variable defined in the subjob. The parameter value is usually set to a group of data in the dataset. Each time the job is run, the parameter value is transferred to the subjob for use. For example, parameter value #{Loop.current[0]} indicates that the first value of each row of data in the dataset is traversed and transferred to the subjob.

                                                        Figure 1 shows an example For Each node. As shown in the figure, the parameter name of the foreach subjob is result, and the parameter value is the traversal of the one-dimensional array dataset [['1'],['3'],['2']] (that is, the value is 1, 3, and 2 in the first, second, and third loop, respectively).

                                                        -
                                                        Figure 1 For Each node
                                                        +
                                                        Figure 1 For Each node

                                                        For Each Nodes and EL Expressions

                                                        To use For Each nodes properly, you must be familiar with EL expressions. For details about how to use EL expressions, see EL Expressions.

                                                        For Each nodes use the following EL expressions most:

                                                        @@ -83,28 +83,28 @@ INSERT INTO Table_List VALUES ('a_new','a'),('b_2','b'),('c_3','c'),('d_1','d'), SELECT * FROM Table_List;

                                                        The generated data in the Table_List table is as follows:

                                                        -
                                                        Figure 2 Data in the Table_List table
                                                        +
                                                        Figure 2 Data in the Table_List table

                                                      5. Create a subjob named ForeachDemo to be executed cyclically. In this operation, a task containing the DLI SQL node is defined to be executed cyclically.

                                                        1. Access the DataArts Studio DataArts Factory page, choose Develop Job. Create a job named ForeachDemo, select the DLI SQL node, and configure the job as shown in Figure 3.
                                                          In the DLI SQL statement, set the variable to be replaced to ${}. The following SQL statement is used to import all data in the ${Source} table to the ${Destination} table. ${fromTable} and ${toTable} are the variables. The SQL statement is as follows:
                                                          INSERT INTO ${Destination} select * from ${Source};

                                                          Do not use the #{Job.getParam("job_param_name")} EL expression because this expression can only obtain the values of the parameters configured in the current job, but cannot obtain the parameter values transferred from the parent job or the global variables configured in the workspace. The expression only works for the current job.

                                                          To obtain the parameter values passed from the parent job and the global variables configured for the workspace, you are advised to use the ${job_param_name} expression.

                                                          -
                                                          Figure 3 Cyclically executing a subjob
                                                          -
                                                        2. After configuring the SQL statement, configure parameters for the subjob. You only need to set the parameter names, which are used by the For Each operator of the ForeachDemo_master job to identify subjob parameters.
                                                          Figure 4 Configuring subjob parameters
                                                          +
                                                          Figure 3 Cyclically executing a subjob
                                                          +
                                                        3. After configuring the SQL statement, configure parameters for the subjob. You only need to set the parameter names, which are used by the For Each operator of the ForeachDemo_master job to identify subjob parameters.
                                                          Figure 4 Configuring subjob parameters

                                                        4. Save the job.
                                                        -

                                                      6. Create a master job named ForeachDemo_master where the For Each node is located.

                                                        1. Access the DataArts Studio DataArts Studio page and choose Develop Job. Create a data development master job named ForeachDemo_master. Select the DLI SQL and For Each nodes and click and drag to compile the job shown in Figure 5.
                                                          Figure 5 Compiling a job
                                                          +

                                                        2. Create a master job named ForeachDemo_master where the For Each node is located.

                                                          1. Access the DataArts Studio DataArts Studio page and choose Develop Job. Create a data development master job named ForeachDemo_master. Select the DLI SQL and For Each nodes and click and drag to compile the job shown in Figure 5.
                                                            Figure 5 Compiling a job
                                                          2. Configure the properties of the DLI SQL node. Select SQL statement and and enter the following statement. The DLI SQL node reads data from the DLI table Table_List and uses it as the dataset.
                                                            SELECT * FROM Table_List;
                                                            -
                                                            Figure 6 DLI SQL node configuration
                                                            +
                                                            Figure 6 DLI SQL node configuration
                                                          3. Configure properties for the For Each node.
                                                            • Subjob in a Loop: Select ForeachDemo, which is the subjob that has been developed in step 2.
                                                            • Dataset: Enter the execution result of the select statement on the DLI SQL node. Use the #{Job.getNodeOutput('preDLI')} expression, where preDLI is the name of the previous node.
                                                            • Subjob Parameter Name: used to transfer data in the dataset to the subjob Source corresponds to the first column in the Table_List table of the dataset, and Destination corresponds to the second column. Therefore, enter EL expression #{Loop.current[0]} for Source and #{Loop.current[1]} for Destination.
                                                            -
                                                            Figure 7 Configuring properties for the For Each node
                                                            +
                                                            Figure 7 Configuring properties for the For Each node
                                                          4. Save the job.
                                                          -

                                                        3. Test the main job.

                                                          1. Click Test above the canvas to test the main job. After the main job is executed, the subjob is automatically invoked through the For Each node and executed.
                                                          2. In the navigation pane on the left, choose Monitor Instance to view the job execution status. After the job is successfully executed, you can view the subjob instances generated on the For Each node. Because the dataset contains six rows of data, six subjob instances are generated.
                                                            Figure 8 Viewing job instances
                                                            +

                                                          3. Test the main job.

                                                            1. Click Test above the canvas to test the main job. After the main job is executed, the subjob is automatically invoked through the For Each node and executed.
                                                            2. In the navigation pane on the left, choose Monitor Instance to view the job execution status. After the job is successfully executed, you can view the subjob instances generated on the For Each node. Because the dataset contains six rows of data, six subjob instances are generated.
                                                              Figure 8 Viewing job instances
                                                            3. Check whether the data has been inserted into the six DLI destination tables. You can create a DLI SQL script on the DataArts Factory page and run the following commands to import data into the table. You can also run the following SQL commands in the SQL editor on the DLI console.
                                                              /* Run the following command to query the data in a table (table a is used as an example): */
                                                               SELECT * FROM a;

                                                              Compare the obtained data with the data in Insert data into the source data table. The inserted data meets the expectation.

                                                              -
                                                              Figure 9 Destination table data
                                                              +
                                                              Figure 9 Destination table data

                                                          @@ -119,3 +119,10 @@ SELECT * FROM a;
                                                      7. + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0583.html b/docs/dataartsstudio/umn/dataartsstudio_01_0583.html index d3c8e5b8f..972d838cb 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0583.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0583.html @@ -7,18 +7,18 @@

                                                        IF statements use EL expressions. You can select EL expressions and follow the instruction in this section to develop jobs.

                                                        Determining the IF Statement Branch to Be Executed Based on the Execution Status of the Previous Node

                                                        Scenario

                                                        Generally, you can determine the IF statement branch to be executed based on whether the previous CDM node is successfully executed. For details on how to set IF statements, see Figure 1.

                                                        -
                                                        Figure 1 Example job
                                                        +
                                                        Figure 1 Example job

                                                        Configuration Method

                                                        -
                                                        1. Log in to the DataArts Studio console, locate the target DataArts Studio instance, and click Access on the instance card.
                                                        2. Click the Workspaces tab. In the workspace list, locate the target workspace and click DataArts Factory. The DataArts Factory console is displayed.
                                                        3. On the Develop Job page, create a job, drag a CDM node and two Dummy nodes and drop them on the canvas in the right pane. Click and hold to connect the CDM node to the Dummy nodes, as shown in Figure 1.

                                                          Set the Failure Policy for the CDM node to Go to the next node.

                                                          -
                                                          Figure 2 Configuring the failure policy for the CDM node
                                                          +
                                                          1. Log in to the DataArts Studio console, locate the target DataArts Studio instance, and click Access on the instance card.
                                                          2. Click the Workspaces tab. In the workspace list, locate the target workspace and click DataArts Factory. The DataArts Factory console is displayed.
                                                          3. On the Develop Job page, create a job, drag a CDM node and two Dummy nodes and drop them on the canvas in the right pane. Click and hold to connect the CDM node to the Dummy nodes, as shown in Figure 1.

                                                            Set the Failure Policy for the CDM node to Go to the next node.

                                                            +
                                                            Figure 2 Configuring the failure policy for the CDM node

                                                          4. Right-click the connection line and select Set Condition. In the Edit EL Expression dialog box, enter the IF statement in the text box.

                                                            Each statement branch requires an IF statement. The IF statement is a ternary expression based on the EL expression syntax. If the result of the ternary expression is true, subsequent nodes will be connected. Otherwise, subsequent nodes will be skipped.

                                                            In this demo, the #{Job.getNodeStatus("node_name")} EL expression is used to obtain the execution status of a specified node. If the execution is successful, success is returned; otherwise, fail is returned. In this example, the IF statement expressions are as follows:

                                                            • The IF statement expression for branch A is #{(Job.getNodeStatus("CDM")) == "success" ?. "true" : "false"}
                                                            • The IF statement expression for branch B is #{(Job.getNodeStatus("CDM")) == "fail" ?. "true" : "false"}
                                                            -
                                                            After entering the IF statement expression, you can select either Skip all subsequent nodes or Skip the next node for Failure Policy. After the configuration is complete, click OK to save the job.
                                                            Figure 3 Configuring a failure policy
                                                            +
                                                            After entering the IF statement expression, you can select either Skip all subsequent nodes or Skip the next node for Failure Policy. After the configuration is complete, click OK to save the job.
                                                            Figure 3 Configuring a failure policy
                                                            -

                                                          5. Click Test to test the job and view the execution result on the Monitor Instance page.
                                                          6. After the job is executed, view the job instance running result on the Monitor Instance page. The execution result meets the expectation. If the execution result is fail, branch A is skipped and branch B is executed.

                                                            Figure 4 Job execution result
                                                            +

                                                          7. Click Test to test the job and view the execution result on the Monitor Instance page.
                                                          8. After the job is executed, view the job instance running result on the Monitor Instance page. The execution result meets the expectation. If the execution result is fail, branch A is skipped and branch B is executed.

                                                            Figure 4 Job execution result

                                                        Determining the IF Statement Branch to Be Executed Based on the Execution Result of the Previous Node

                                                        Scenario Description

                                                        @@ -27,48 +27,48 @@

                                                        In this scenario, the loop expression cannot be replaced by the StringUtil expression #{StringUtil.split(StringUtil.split(StringUtil.split(Job.getNodeOutput("Name of the previous node"),"]")[0],"[")[0],"\\"")[0]} because the StringUtil expression returns a string which cannot be compared with the standard data of the int type.

                                                        Figure 5 shows the job orchestration.

                                                        -
                                                        Figure 5 Example job
                                                        +
                                                        Figure 5 Example job

                                                        Key configurations of the For Each node are as follows:

                                                        • Dataset: Enter the execution result of the select statement on the Hive SQL node. Use the #{Job.getNodeOutput('HIVE')} expression, where HIVE is the name of the previous node.
                                                        • Subjob Parameter Name: Enter the parameter defined in the subjob. Transfer the output of the previous node of the main job to the sub-job for use. The variable name is result, and its value is a column in the dataset. The EL expression #{Loop.dataArray[0][0]} or #{Loop.current[]} is used. This example uses {Loop.dataArray[0][0]} as an example.

                                                        The sub-job selected on the For Each node determines the IF statement branch to be executed based on the subjob parameter transferred from the For Each node. Figure 6 shows the job orchestration.

                                                        -
                                                        Figure 6 Example sub-job
                                                        +
                                                        Figure 6 Example sub-job

                                                        The IF statement is the key configuration of the subjob. This example uses the expression ${result} to obtain the value of the job parameter.

                                                        Do not use the #{Job.getParam("job_param_name")} EL expression because this expression can only obtain the values of the parameters configured in the current job, but cannot obtain the parameter values transferred from the parent job or the global variables configured in the workspace. The expression only works for the current job.

                                                        To obtain the parameter values passed from the parent job and the global variables configured for the workspace, you are advised to use the ${job_param_name} expression.

                                                        Configuration Method

                                                        Developing a Subjob

                                                        -
                                                        1. Log in to the DataArts Studio console, locate the target DataArts Studio instance, and click Access on the instance card.
                                                        2. Click the Workspaces tab. In the workspace list, locate the target workspace and click DataArts Factory. The DataArts Factory console is displayed.
                                                        3. On the Develop Job page, create a data development subjob For Each. Drag four Dummy nodes and drop them on the canvas, click and hold to connect them, as shown in Figure 6.
                                                        4. Right-click the connection line and select Set Condition. In the Edit EL Expression dialog box, enter the IF statement in the text box.

                                                          Each statement branch requires an IF statement. The IF statement is a ternary expression based on the EL expression syntax. If the result of the ternary expression is true, subsequent nodes will be connected. Otherwise, subsequent nodes will be skipped.

                                                          +
                                                          1. Log in to the DataArts Studio console, locate the target DataArts Studio instance, and click Access on the instance card.
                                                          2. Click the Workspaces tab. In the workspace list, locate the target workspace and click DataArts Factory. The DataArts Factory console is displayed.
                                                          3. On the Develop Job page, create a data development subjob For Each. Drag four Dummy nodes and drop them on the canvas, click and hold to connect them, as shown in Figure 6.
                                                          4. Right-click the connection line and select Set Condition. In the Edit EL Expression dialog box, enter the IF statement in the text box.

                                                            Each statement branch requires an IF statement. The IF statement is a ternary expression based on the EL expression syntax. If the result of the ternary expression is true, subsequent nodes will be connected. Otherwise, subsequent nodes will be skipped.

                                                            • For the >5 branch, the IF statement expression is #{${result} > 5 ? "true" : "false"}.
                                                            • For the =5 branch, the IF statement expression is #{${result} == 5 ? "true" : "false"}.
                                                            • For the <5 branch, the IF statement expression is #{${result} < 5 ? "true" : "false"}.

                                                            After entering the IF statement expression, you can select either Skip all subsequent nodes or Skip the next node for Failure Policy.

                                                            If an expression contains multiple conditions, you can use || to combine them conditions. The following is an example:

                                                            #{(${result} >= 19 || ${result} <=9) ? "true" : "false"}

                                                            -

                                                          5. Configure job parameters. Set the parameter name to result. This parameter is only used by the For Each node in the main job testif to identify subjob parameters. You do not need to set the parameter value.

                                                            Figure 7 Configuring job parameters
                                                            +

                                                          6. Configure job parameters. Set the parameter name to result. This parameter is only used by the For Each node in the main job testif to identify subjob parameters. You do not need to set the parameter value.

                                                            Figure 7 Configuring job parameters

                                                          7. Save the job.

                                                        Developing a Job

                                                        -
                                                        1. On the Develop Job page, create a data development job named testif. Drag a HIVE SQL node and a For Each node and drop them on the canvas. Click and hold to connect the nodes, as shown in Figure 5.
                                                        2. Configure properties for the HIVE SQL node. Reference the following SQL script (there is no special requirement for other properties):

                                                          --Obtain the number of people whose scores are higher than 85 from the student_score table.
                                                          +
                                                          1. On the Develop Job page, create a data development job named testif. Drag a HIVE SQL node and a For Each node and drop them on the canvas. Click and hold to connect the nodes, as shown in Figure 5.
                                                          2. Configure properties for the HIVE SQL node. Reference the following SQL script (there is no special requirement for other properties):

                                                            --Obtain the number of people whose scores are higher than 85 from the student_score table.
                                                             SELECT count(*) FROM student_score WHERE score> "85" ;
                                                            -
                                                            Figure 8 HIVE SQL script execution result
                                                            +
                                                            Figure 8 HIVE SQL script execution result

                                                          3. Configure properties for the For Each node.

                                                            • Subjob in a Loop: Select foreach, the subjob that has been developed.
                                                            • Dataset: Enter the execution result of the select statement on the Hive SQL node. Use the #{Job.getNodeOutput('HIVE')} expression, where HIVE is the name of the previous node.
                                                            • Subjob Parameter Name: Enter the parameter defined in the subjob. Transfer the output of the previous node of the main job to the sub-job for use. The variable name is result (parameter name of the subjob), and its value is a column in the dataset. The EL expression #{Loop.dataArray[0][0]} is used.
                                                            -
                                                            Figure 9 Properties of the For Each node
                                                            +
                                                            Figure 9 Properties of the For Each node

                                                          4. Save the job.

                                                          Testing the Main Job

                                                          -
                                                          1. Click Test above the canvas to test the main job. After the main job is executed, the subjob is automatically invoked through the For Each node and executed.
                                                          2. In the navigation pane on the left, choose Monitor Instance to view the job execution result.
                                                          3. After the job is executed, view the execution result of the subjob foreach on the Monitor Instance page. The execution result meets the expectation. Currently, the execution result of the Hive SQL statement is 4. Therefore, the >5 and =5 branches are skipped, and the <5 branch is successfully executed.

                                                            Figure 10 Execution result of the subjob
                                                            +
                                                            1. Click Test above the canvas to test the main job. After the main job is executed, the subjob is automatically invoked through the For Each node and executed.
                                                            2. In the navigation pane on the left, choose Monitor Instance to view the job execution result.
                                                            3. After the job is executed, view the execution result of the subjob foreach on the Monitor Instance page. The execution result meets the expectation. Currently, the execution result of the Hive SQL statement is 4. Therefore, the >5 and =5 branches are skipped, and the <5 branch is successfully executed.

                                                              Figure 10 Execution result of the subjob

                                                            Configuring the Policy for Executing a Node with Multiple IF Statements

                                                            If the execution of a node depends on multiple IF statements, the policy for executing the node can be AND or OR.

                                                            If you choose the OR policy, the node will be executed if any one of the IF statements is met.

                                                            If you choose the AND policy, the node will be executed only if all of the IF statements are met.

                                                            If you choose neither, the OR policy will be used.

                                                            -
                                                            Figure 11 A job with multiple IF statements
                                                            +
                                                            Figure 11 A job with multiple IF statements

                                                            Configuration Method

                                                            Configure the execution policy.

                                                            1. Log in to the DataArts Studio console, locate the target DataArts Studio instance, and click Access on the instance card.
                                                            2. Click the Workspaces tab. In the workspace list, locate the target workspace and click DataArts Factory. The DataArts Factory console is displayed.
                                                            3. On the DataArts Factory console, choose Configuration > Configure > Default Configuration.
                                                            4. Select AND or OR for Multi-IF Policy.
                                                            5. Click Save.

                                                            Develop a job.

                                                            -
                                                            1. On the Develop Job page, create a data development job.
                                                            2. Drag three DWS SQL operators as parent nodes and one Python operator as a child node to the canvas. Click and hold to connect the nodes to orchestrate the job shown in Figure 11.
                                                            3. Right-click the connection line and select Set Condition. In the Edit EL Expression dialog box, enter the IF statement in the text box.

                                                              Each statement branch requires an IF statement. The IF statement is a ternary expression based on the EL expression syntax.

                                                              +
                                                              1. On the Develop Job page, create a data development job.
                                                              2. Drag three DWS SQL operators as parent nodes and one Python operator as a child node to the canvas. Click and hold to connect the nodes to orchestrate the job shown in Figure 11.
                                                              3. Right-click the connection line and select Set Condition. In the Edit EL Expression dialog box, enter the IF statement in the text box.

                                                                Each statement branch requires an IF statement. The IF statement is a ternary expression based on the EL expression syntax.

                                                                • The IF statement expression for the test1 node is #{(Job.getNodeStatus("test1")) == "success" ? "true" : "false"},
                                                                • The IF statement expression for the test2 node is #{(Job.getNodeStatus("test2")) == "success" ? "true" : "false"},
                                                                • The IF statement expression for the test3 node is #{(Job.getNodeStatus("test3")) == "success" ? "true" : "false"},

                                                                The expression of each node is determined using the IF statement based on the execution status of the previous node.

                                                                After entering the IF statement expression, you can select either Skip all subsequent nodes or Skip the next node for Failure Policy.

                                                                @@ -78,9 +78,9 @@ SELECT count(*) FROM student_score WHERE score> "85" ;

                                                          If test2 is executed successfully, the corresponding IF statement is true.

                                                          If test3 fails to be executed, the corresponding IF statement is false.

                                                          If Multi-IF Policy is set to OR, the showtables node is executed and the job execution is complete.

                                                          -
                                                          Figure 12 How the job runs if Multi-IF Policy is OR
                                                          +
                                                          Figure 12 How the job runs if Multi-IF Policy is OR

                                                          If Multi-IF Policy is set to AND, the showtables node is skipped and the job execution is complete.

                                                          -
                                                          Figure 13 How the job runs if Multi-IF Policy is AND
                                                          +
                                                          Figure 13 How the job runs if Multi-IF Policy is AND

                                                        @@ -90,3 +90,10 @@ SELECT count(*) FROM student_score WHERE score> "85" ; + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0584.html b/docs/dataartsstudio/umn/dataartsstudio_01_0584.html index d665813f7..b28eecf5e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0584.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0584.html @@ -38,7 +38,7 @@
                                                        In this example, the MRS Hive SQL node returns a two-dimensional array that contains a single field. The data sent by the Kafka Client node is defined as the StringUtil EL expression with an embedded object. You can use this expression to split the two-dimensional array and obtain the output field value of the MRS Hive SQL node.

                                                        To make it easy to view the obtained value, this example uses the Kafka Client node. In practice, you can select a subsequent node type as needed. By using a StringUtil EL expression with an embedded object on the node, you can obtain the data value returned by the previous node.

                                                        -
                                                        Figure 1 Example job
                                                        +
                                                        Figure 1 Example job
                                                        The key configuration of the Kafka Client node is the Sent Content parameter. Set it as follows:
                                                        #{StringUtil.split(StringUtil.split(StringUtil.split(Job.getNodeOutput("count95"),"]")[0],"[")[0],"\\"")[0]}

                                                        Configuration Method

                                                        @@ -58,13 +58,13 @@ VALUES ('CEHN', '99');

                                                      8. Create the Hive SQL script to be invoked by the MRS Hive SQL node. Create a Hive SQL script named count95, select a Hive connection and database, paste the following SQL statement, and submit a version.

                                                        --Obtain the number of students whose scores are higher than 95 from the student_score table.--
                                                         SELECT count(*) FROM student_score WHERE score> "95" ; 
                                                        -

                                                      9. On the Develop Job page, create a data development job. Drag an MRS Hive SQL node and a Kafka Client node and drop them on the canvas. Click and hold to connect the nodes, as shown in Figure 1.
                                                      10. Configuring parameters for an MRS Hive SQL node Select the count95 script submitted in 4 for SQL script and select a Hive connection and database.

                                                        Figure 2 Configuring parameters for an MRS Hive SQL node
                                                        +

                                                      11. On the Develop Job page, create a data development job. Drag an MRS Hive SQL node and a Kafka Client node and drop them on the canvas. Click and hold to connect the nodes, as shown in Figure 1.
                                                      12. Configuring parameters for an MRS Hive SQL node Select the count95 script submitted in 4 for SQL script and select a Hive connection and database.

                                                        Figure 2 Configuring parameters for an MRS Hive SQL node

                                                        -

                                                      13. Configure parameters for the Kafka Client node. Set Sent Content to #{StringUtil.split(StringUtil.split(StringUtil.split(Job.getNodeOutput("count95"),"]")[0],"[")[0],"\\"")[0]} and select a Kafka connection and a topic name.

                                                        Figure 3 Configuring parameters for the Kafka Client node
                                                        +

                                                      14. Configure parameters for the Kafka Client node. Set Sent Content to #{StringUtil.split(StringUtil.split(StringUtil.split(Job.getNodeOutput("count95"),"]")[0],"[")[0],"\\"")[0]} and select a Kafka connection and a topic name.

                                                        Figure 3 Configuring parameters for the Kafka Client node

                                                      15. After the node configuration is complete, click Test. After the job test is successful, right-click the Kafka Client node to view its log. You can find that the two-dimensional array [["2"]] returned by the MRS Hive SQL node has been converted to 2.

                                                        You can set Sent Content of the Kafka Client node to #{Job.getNodeOutput("count95")} and run the job. Then you can view the log of the Kafka Client node to verify that the result returned by the MRS Hive SQL node is two-dimensional array [["2"]].

                                                        -
                                                        Figure 4 Check the Kafka Client node logs.
                                                        +
                                                        Figure 4 Check the Kafka Client node logs.

                                                      16. @@ -75,9 +75,9 @@ SELECT count(*) FROM student_score WHERE score> "95" ;
                                                        Orchestrate the main job shown in Figure 5. Key configurations of the For Each node are as follows:
                                                        • Dataset: Enter the execution result of the select statement on the Hive SQL node. Use the #{Job.getNodeOutput("select95")} expression, where select95 is the name of the previous node.
                                                        • Subjob Parameter Name: Enter the parameter name defined in the subjob. Transfer the parameter value defined in the main job to the subjob. Set the subjob parameter names to name and score, whose values are those in the first and second columns in the dataset, respectively. EL expressions #{Loop.current[0]} and #{Loop.current[1]} are used.
                                                        -
                                                        Figure 5 Example main job
                                                        +
                                                        Figure 5 Example main job

                                                        For the subjobs selected for the For Each node, you must set their parameter names so that the main job can identify the parameter definitions.

                                                        -
                                                        Figure 6 Example subjob
                                                        +
                                                        Figure 6 Example subjob

                                                        Configuration Method

                                                        Developing a Subjob

                                                        @@ -85,7 +85,7 @@ SELECT count(*) FROM student_score WHERE score> "95" ;

                                                      17. Configure parameters for the Kafka Client node. Set Sent Content to ${name}: ${score} and select a Kafka connection and a topic name.

                                                        Do not use the #{Job.getParam("job_param_name")} EL expression because this expression can only obtain the values of the parameters configured in the current job, but cannot obtain the parameter values transferred from the parent job or the global variables configured in the workspace. The expression only works for the current job.

                                                        To obtain the parameter values passed from the parent job and the global variables configured for the workspace, you are advised to use the ${job_param_name} expression.

                                                        -
                                                        Figure 7 Configuring parameters for the Kafka Client node
                                                        +
                                                        Figure 7 Configuring parameters for the Kafka Client node

                                                      18. Submit the subjob after the configuration is complete.
                                                      19. @@ -106,16 +106,16 @@ VALUES ('CEHN', '99');

                                                      20. Create the Hive SQL script to be invoked by the MRS Hive SQL node. Create a Hive SQL script named select95, select a Hive connection and database, paste the following SQL statement, and submit a version.

                                                        --Display the names and scores of students whose scores are higher than 95 in the student_score table.--
                                                         SELECT * FROM student_score WHERE score> "95" ; 
                                                        -

                                                      21. On the Develop Job page, create a data development job named EL_test_master. Drag a HIVE SQL node and a For Each node and drop them on the canvas. Click and hold to connect the nodes, as shown in Figure 5.
                                                      22. Configure parameters for the MRS Hive SQL node. Select the select95 script submitted in 3 for SQL script and select a Hive connection and database.

                                                        Figure 8 Configuring parameters for an MRS Hive SQL node
                                                        +

                                                      23. On the Develop Job page, create a data development job named EL_test_master. Drag a HIVE SQL node and a For Each node and drop them on the canvas. Click and hold to connect the nodes, as shown in Figure 5.
                                                      24. Configure parameters for the MRS Hive SQL node. Select the select95 script submitted in 3 for SQL script and select a Hive connection and database.

                                                        Figure 8 Configuring parameters for an MRS Hive SQL node

                                                      25. Configure properties for the For Each node.

                                                        • Subjob in a Loop: Select EL_test_slave, the subjob that has been developed.
                                                        • Dataset: Enter the execution result of the select statement on the Hive SQL node. Use the #{Job.getNodeOutput("select95")} expression, where select95 is the name of the previous node.
                                                        • Subjob Parameter Name: Enter the parameter name defined in the subjob. Transfer the parameter value defined in the main job to the subjob. Set the subjob parameter names to name and score, whose values are those in the first and second columns in the dataset, respectively. EL expressions #{Loop.current[0]} and #{Loop.current[1]} are used.
                                                        -
                                                        Figure 9 Configuring properties for the For Each node
                                                        +
                                                        Figure 9 Configuring properties for the For Each node

                                                      26. Save the job.
                                                      27. Testing the Main Job

                                                        -
                                                        1. Click Test above the main job EL_test_master canvas to test the job. After the main job is executed, the subjob EL_test_slave is cyclically invoked through the For Each node and executed.
                                                        2. In the navigation pane on the left, choose Monitor Instance to view the job execution result.
                                                        3. After the job is executed, view the cyclic execution result of the subjob EL_test_slave on the Monitor Instance page.

                                                          Figure 10 Execution result of the subjob
                                                          +
                                                          1. Click Test above the main job EL_test_master canvas to test the job. After the main job is executed, the subjob EL_test_slave is cyclically invoked through the For Each node and executed.
                                                          2. In the navigation pane on the left, choose Monitor Instance to view the job execution result.
                                                          3. After the job is executed, view the cyclic execution result of the subjob EL_test_slave on the Monitor Instance page.

                                                            Figure 10 Execution result of the subjob

                                                            -

                                                          4. View the log of the cyclic execution of subjob EL_test_slave. The log shows that the output values of the previous node of the For Each node was obtained through the For Each node and the EL expression with a Loop embedded object.

                                                            Figure 11 Viewing the log
                                                            +

                                                          5. View the log of the cyclic execution of subjob EL_test_slave. The log shows that the output values of the previous node of the For Each node was obtained through the For Each node and the EL expression with a Loop embedded object.

                                                            Figure 11 Viewing the log

                                                          @@ -125,3 +125,10 @@ SELECT * FROM student_score WHERE score> "95" ; + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0585.html b/docs/dataartsstudio/umn/dataartsstudio_01_0585.html index b894c274a..71e2cb2c9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0585.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0585.html @@ -6,7 +6,7 @@
                                                          • In addition to SQL scripts, PatchData supports other nodes.
                                                          • If the content of a SQL script changes, the PatchData job runs the latest script.
                                                          • When you use PatchData, if the variable in the SQL statement is DATE, enter ${DATE} in the script. The script parameter DATE is then automatically added to the job parameters, and its value can be an EL expression. If the variable is a time variable, enter the expression of the DateUtil embedded object. The platform automatically converts the expression into a historical date.
                                                          • PatchData jobs support script parameters and global environment variables as well as job parameters.
                                                          -

                                                          Constraints

                                                          • PatchData is available only when periodic scheduling is configured for the data development job.
                                                          +

                                                          Constraints

                                                          PatchData is available only when periodic scheduling is configured for the data development job.

                                                          Example

                                                          Scenario

                                                          Among the product data tables of a company, there is a source data table A that records the product sales amount. To import the historical product sales amount to the destination table B, you can create a PatchData job.

                                                          @@ -39,27 +39,27 @@ INSERT INTO A VALUES ('1','60', '2022-02-27'); INSERT INTO A VALUES ('2','45', '2022-02-27');
                                                      28. Develop a PatchData script. Ensure that the script expression contains a time variable. (For example, if the variable in the SQL statement is DATE, enter ${DATE} in the script.) You can set the expression for script parameter DATE in job parameter settings in 3.
                                                        On the Develop Script page, enter following statement in the editor:
                                                        INSERT INTO B (SELECT * FROM A WHERE DATE = ${DATE})
                                                        -
                                                        Figure 1 Developing a script
                                                        +
                                                        Figure 1 Developing a script

                                                        After compiling the script, save it and submit the latest version.

                                                      29. Develop a PatchData batch processing job. When developing the job, you need to configure the node attributes and scheduling period.

                                                        In the left navigation pane of the DataArts Factory console, choose Data Development > Develop Job.

                                                        -
                                                        Figure 2 Node parameters
                                                        +
                                                        Figure 2 Node parameters

                                                        -
                                                        • If the job-associated SQL script uses a parameter, the parameter name (such as DATE) is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                          If the parameter is time, view the example expression of the DateUtil embedded object. The platform automatically replaces the parameter with the historical date of the patch data (determined by the service date of the patch data).

                                                          +
                                                          • If the job-associated SQL script uses a parameter, the parameter name (such as DATE) is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                            If the parameter is time, view the example expression of the DateUtil embedded object. The platform automatically replaces the parameter with the historical date of the patch data (determined by the service date of the patch data).

                                                            You can also directly enter a SQL expression.

                                                            -
                                                          • If the parameters of the associated SQL script change, you can click to synchronize the change or click to edit the parameters.
                                                          • The following is an example of script parameters:
                                                            Example: #{DateUtil.format(DateUtil.addDays(Job.planTime,-1),'yyyy-MM-dd')}
                                                            • Job.planTime indicates the planned job time, and yyyy-MM-dd indicates the time format.
                                                            • If the planned job time is March 2, the previous day is March 1. The planned job time will be replaced by the configured patch data service date.
                                                            • The Job.planTime is converted into a time in the yyyy-MM-dd format using an expression.
                                                            +
                                                          • If the parameters of the associated SQL script change, you can click to synchronize the change or click to edit the parameters.
                                                          • The following is an example of script parameters:
                                                            Example: #{DateUtil.format(DateUtil.addDays(Job.planTime,-1),'yyyy-MM-dd')}
                                                            • Job.planTime indicates the planned job time, and yyyy-MM-dd indicates the time format.
                                                            • If the planned job time is March 2, the previous day is March 1. The planned job time will be replaced by the configured patch data service date.
                                                            • The Job.planTime is converted into a time in the yyyy-MM-dd format using an expression.

                                                          Configure the scheduling period of the PatchData job. Click Scheduling Setup and set Scheduling Frequency to Every day.

                                                          -
                                                          Figure 3 Configuring the scheduling period
                                                          +
                                                          Figure 3 Configuring the scheduling period

                                                          • If Scheduling Frequency is set to Every day, the job is scheduled every day, and a PatchData instance is generated. You can view the statuses of PatchData instances on the Monitor Instance page. On the Monitor Instance page, view the instance information about the job and perform more operations on instances as required.
                                                          • The job scheduling time takes effect from March 9, 2023, and the job is scheduled at 02:00 every day.
                                                          • Run the following SQL statement to check whether destination table B contains data of source table A:

                                                            SELECT * FROM B

                                                          After configuring the parameters, save and submit the latest version of the job and test the job.

                                                          Click Execute to run the job.

                                                          -
                                                        • Create a PatchData task.
                                                          After creating a periodic job, you need to configure PatchData for the job.
                                                          1. In the left navigation pane of DataArts Factory, choose Monitoring > Monitor Job.
                                                          2. Click the Batch Job Monitoring tab. In the Operation column of the job, choose More > Configure PatchData. The Configure PatchData page is displayed.
                                                            If you want to supplement historical data from February 27, 2023 to March 1, 2023, set Date to Feb 28, 2023 00:00:00 – Mar 02, 2023 23:59:59. The system automatically transfers the configured date to the planned job time. In the expression of the script time variable DATE, the defined time is the planned job time minus one day. That is, the time of the day before the planned job time is the time range (Feb 27, 2023 to Mar 1, 2023) for PatchData.
                                                            Figure 4 Configuring PatchData
                                                            +
                                                          3. Create a PatchData task.
                                                            After creating a periodic job, you need to configure PatchData for the job.
                                                            1. In the left navigation pane of DataArts Factory, choose Monitoring > Job Monitoring.
                                                            2. Click the Batch Job Monitoring tab. In the Operation column of the job, choose More > Configure PatchData. The Configure PatchData page is displayed.
                                                              If you want to supplement historical data from February 27, 2023 to March 1, 2023, set Date to Feb 28, 2023 00:00:00 – Mar 02, 2023 23:59:59. The system automatically transfers the configured date to the planned job time. In the expression of the script time variable DATE, the defined time is the planned job time minus one day. That is, the time of the day before the planned job time is the time range (Feb 27, 2023 to Mar 1, 2023) for PatchData.
                                                              Figure 4 Configuring PatchData

                                                              @@ -104,7 +104,8 @@ INSERT INTO A VALUES ('2','45', '2022-02-27');
                                                      30. Table 3 Parameters for rerunning a job

                                                        Parameter

                                                        +
                                                        - - - - - - - - - - - - - - - @@ -221,12 +264,12 @@ -

                                                        Viewing the DAG

                                                        You can view the dependency between instances and perform O&M operations on the DAG.

                                                        -
                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                        3. In the navigation pane on the left of the DataArts Factory page, choose Monitoring > Monitor Instance
                                                        4. Locate the row that contains a job and click DAG in the Operation column.
                                                          Figure 2 DAG
                                                          +

                                                          Viewing the DAG

                                                          You can view the dependency between job instances and perform O&M operations on the DAG.

                                                          +
                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          3. In the navigation pane on the left of the DataArts Factory page, choose Monitoring > Monitor Instance
                                                          4. Locate the row that contains a job and click DAG in the Operation column.
                                                            Figure 7 DAG

                                                            By default, the DAG displays the current job instance and its upstream and downstream job instances. It supports the following operations:

                                                            -
                                                            • Click in the upper right corner of the DAG to restore the DAG to the initial state, and click to close the DAG. Drag in the upper left corner of the DAG to change its width.
                                                            • Click a job instance to select it.
                                                              Figure 3 Selecting a job instance
                                                              +
                                                              • Click in the upper right corner of the DAG to restore the DAG to the initial state, and click to close the DAG. Drag in the upper left corner of the DAG to change its width.
                                                              • Click a job instance to select it.
                                                                Figure 8 Selecting a job instance
                                                                • When a job instance is selected, the background colors of the job instance and its upstream and downstream instances are darkened.
                                                                • Brief information about the instance is displayed in the lower right corner of the DAG. The instance name and ID can be directly copied.
                                                                • Click Show Details to open the details panel, which displays information such as the instance attributes, job parameters, node list, and historical instances. You can adjust the height of the panel or close it.
                                                                • Click the blank area to deselect the job instance.
                                                                -
                                                              • Right-click a job instance to expand its upstream and downstream job instances. You can stop, rerun, continue to execute instances, forcibly make instances succeed, analyze the upstream node, and edit the job.
                                                                Figure 4 Performing operations on job instances
                                                                +
                                                              • Right-click a job instance to expand its upstream and downstream job instances. You can stop, rerun, continue to execute instances, forcibly make instances succeed, analyze the upstream node, and edit the job.
                                                                Figure 9 Performing operations on job instances

                                                          @@ -251,6 +294,7 @@
                                                        @@ -289,7 +333,7 @@ - @@ -303,3 +347,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0514.html b/docs/dataartsstudio/umn/dataartsstudio_01_0514.html index 26d49bcb9..fe365b022 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0514.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0514.html @@ -2,106 +2,62 @@

                                                        Managing Notifications

                                                        You can configure job notification tasks to notify you of job success or failures.

                                                        -

                                                        Configuring a Notification

                                                        Before configuring a notification for a job:

                                                        +

                                                        Configuring a Notification

                                                        Before configuring a notification for a job:

                                                        • Message notification has been enabled and a topic has been configured.
                                                        • A job not in Not Activated status has been submitted.
                                                        -
                                                        1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                        2. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                        3. On the Notification Management tab page, click Configure Notification. In the displayed dialog box, configure parameters. Table 1 describes the parameters. -
                                                        Table 3 Parameters for rerunning a job

                                                        Parameter

                                                        Description

                                                        +

                                                        Description

                                                        Rerun Type

                                                        +

                                                        Rerun Type

                                                        Type of the instance that you want to rerun.

                                                        +

                                                        Type of the instance that you want to rerun.

                                                        • Rerun selected instance
                                                        • Rerun instances of selected job and its upstream and downstream jobs

                                                        Start Time

                                                        +

                                                        Start Time

                                                        Time range in which instances have been run

                                                        +

                                                        This parameter is required only when Rerun Type is set to Rerun instances of selected job and its upstream and downstream jobs.

                                                        +

                                                        After you set the start time and end time, the system will rerun all the job instances in the specified period.

                                                        +
                                                        NOTE:

                                                        If no job instance can be rerun in the specified period, error message "Job xxx have no instances to rerun" will be displayed.

                                                        +

                                                        List of Rerun Job Instances

                                                        +

                                                        List of Rerun Job Instances

                                                        Upstream and downstream jobs to rerun. You can select multiple jobs at a time.

                                                        -

                                                        The job dependency graph is displayed. For details about how to perform operations on the job dependency graph, see Batch Processing: Viewing a Job Dependency Graph.

                                                        +

                                                        This parameter is required only when Rerun Type is set to Rerun instances of selected job and its upstream and downstream jobs.

                                                        +

                                                        You can select Display the current job and its directly connected jobs or Display complete dependency graphs in the Scheduling-State Job Dependency View dialog box.

                                                        +

                                                        The job dependency view is displayed. You can enter a job name to query the job dependency.

                                                        +
                                                        Figure 3 Job Dependency page
                                                        +

                                                        Select the job to rerun and its upstream and downstream jobs. You can select multiple jobs at a time.

                                                        +
                                                        NOTE:

                                                        If you hover over the question mark on the right of Scheduling-State Job Dependency View, the following information is displayed:

                                                        +
                                                        • When you hover your cursor on a job, its upstream and downstream jobs will be marked blue and yellow, respectively.
                                                        • Drag the blank area to view the complete relationship graph.
                                                        • Click a job in the relationship graph to select all the instances within the duration of the job.
                                                          Figure 4 Rerunning all instances
                                                          +
                                                        • Right-click the job to view its instances, and select and run them again.
                                                          Figure 5 Rerunning some instances
                                                          +
                                                        • If no job instance is selected, No instance selected is displayed.
                                                          Figure 6 No instance selected
                                                          +
                                                        +
                                                        +

                                                        For detailed operations on the job dependency graph, see Batch Job Monitoring: Viewing a Job Dependency Graph.

                                                        Rerun From

                                                        +

                                                        Rerun From

                                                        Start position from which the job instance reruns.

                                                        -
                                                        • Error node: When a job instance fails to be run, it reruns since the error node of the job instance.
                                                        • The first node: When a job instance fails to be run, it reruns since the first node of the job instance.
                                                        • Specified node: When a job instance fails to run, it reruns since the node specified in the job instance. This option is available only if Rerun Type is set to Rerun selected instance.
                                                        +

                                                        Start position from which the job instance reruns.

                                                        +
                                                        • Error node: When a job instance fails to be run, it reruns since the error node of the job instance.
                                                        • The first node: When a job instance fails to be run, it reruns since the first node of the job instance.
                                                        • Specified node: When a job instance fails to run, it reruns since the node specified in the job instance. This option is available only if Rerun Type is set to Rerun selected instance.
                                                        NOTE:

                                                        A job instance reruns from its first node if either of the following cases occurs:

                                                        • The quantity or name of a node in the job changes.
                                                        • The job instance has been successfully run.

                                                        Parameters to Use

                                                        +

                                                        Parameters to Use

                                                        • Parameters of the original job
                                                        • Parameters of the latest job
                                                        +
                                                        • Parameters of the original job
                                                        • Parameters of the latest job

                                                        Concurrent Instances

                                                        +

                                                        Concurrent Instances

                                                        Number of job instances that can be concurrently processed.

                                                        +

                                                        This parameter is required only when Rerun Type is set to Rerun instances of selected job and its upstream and downstream jobs.

                                                        +

                                                        It indicates the number of job instances that can be concurrently processed. The value cannot be less than 1. The default value is 1.

                                                        Ignore OBS Listening

                                                        +

                                                        Ignore OBS Listening

                                                        • Yes: The system does not listen to the OBS path when rerunning the job instance.
                                                        • No: The system listens to the OBS path when rerunning the job instance.
                                                        +

                                                        The default value is Yes.

                                                        +
                                                        • Yes: The system does not listen to the OBS path when rerunning the job instance.
                                                        • No: The system listens to the OBS path when rerunning the job instance.
                                                          NOTE:

                                                          If this parameter is not used, ignore it.

                                                          +
                                                          +

                                                        Successful

                                                        The service logic of a job is successfully executed (including the success of retry upon failure).

                                                        +

                                                        Successful execution statuses include Successful, Forcibly successful, and Failure ignored.

                                                        Forcibly successful

                                                        @@ -261,14 +305,14 @@

                                                        Failure ignored

                                                        As shown in the following figure, a failure handling policy is configured to skip node B and continue to execute node C if node B fails. When the job is executed successfully, the job instance is in Failure ignored state.

                                                        -
                                                        Figure 5 Failure handling policy – Go to the next node
                                                        +
                                                        Figure 10 Failure handling policy – Go to the next node

                                                        Abnormal

                                                        There are few scenarios where this status is displayed. As shown in the following figure, a failure handling policy is configured to suspend the job instance immediately without continuing to execute node C. In this case, the job instance is in Abnormal state.

                                                        -
                                                        Figure 6 Failure handling policy – Suspend current job execution plan
                                                        +
                                                        Figure 11 Failure handling policy – Suspend current job execution plan

                                                        Failed

                                                        A job fails to be executed.

                                                        +

                                                        A job fails to be executed. If a job fails to be executed, you can view the failure cause, for example, a node of the job fails to be executed.

                                                        - - @@ -93,6 +94,7 @@ @@ -104,7 +106,7 @@ + + + +
                                                        Table 1 Notification parameters

                                                        Parameter

                                                        +
                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                        3. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                        4. On the Manage Notification tab page, click Configure Notification. In the displayed dialog box, configure parameters. Table 1 describes the parameters.

                                                          +
                                                          Figure 1 Configuring notifications
                                                          + +
                                                          - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - @@ -110,22 +66,37 @@
                                                        5. Click OK.
                                                        6. Editing a Notification

                                                          After a notification is created, you can modify the notification parameters as required.

                                                          -
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Notification Management tab.
                                                          3. In the Operation column of a notification, click Edit. In the displayed dialog box, edit notification parameters. Table 1 describes the notification parameters.
                                                          4. Click Yes.
                                                          +
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Manage Notification tab.
                                                          3. In the Operation column of a notification, click Edit. In the displayed dialog box, edit notification parameters. Table 1 lists the notification parameters.

                                                            +
                                                            Figure 2 Editing a job
                                                            +
                                                          4. Click Yes.

                                                          Disabling a Notification

                                                          You can disable the notification function on the Edit Notification page or in the notification list.

                                                          -
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Notification Management tab.
                                                          3. In the Notification Function column, click . When it changes to , the notification function is disabled.
                                                          +
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Manage Notification tab.
                                                          3. In the Notification column, click . When it changes to , the notification function is disabled.
                                                            Figure 3 Disabling a Notification
                                                            +

                                                            +

                                                          Viewing a Notification

                                                          You can view all notification information on the Notification Records tab page.

                                                          -
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Notification Records tab.
                                                          +
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Notification Records tab. You can only view data of the last 30 days.
                                                            Figure 4 Viewing notification records
                                                            +

                                                            +

                                                          Deleting a Notification

                                                          If you no longer need a notification, perform the following operations to delete it:

                                                          -
                                                          1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          2. Click the Notification Management tab.
                                                          3. You can delete a notification in either of the following ways:
                                                            • In the Operation column of a notification, click Delete.
                                                            • Select the notifications to delete and click Batch Delete above the notification list.
                                                            +
                                                            1. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                            2. Click the Manage Notification tab.
                                                            3. You can delete a notification in either of the following ways:
                                                              Figure 5 Deleting a notification
                                                              +

                                                              +
                                                              • In the Operation column of a notification, click Delete.
                                                              • Select the notifications to delete and click Batch Delete above the notification list.
                                                            4. In the displayed dialog box, click OK.
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0515.html b/docs/dataartsstudio/umn/dataartsstudio_01_0515.html index cc38832e1..f1b3004e3 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0515.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0515.html @@ -7,68 +7,68 @@

                                                          Prerequisites

                                                          • Simple Message Notification (SMN) has been enabled, topics have been configured, and subscriptions have been added to the topics.
                                                          • Jobs are not in Not started status and have been submitted.
                                                          • OBS has been enabled and a folder has been created in OBS.
                                                          -

                                                          Creating a Notification

                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                          3. On the Cycles tab page, click Create Notification. In the displayed dialog box, configure parameters. Table 1 describes the notification parameters.
                                                            Figure 1 Create a notification
                                                            +

                                                            Creating a Notification

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            3. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                            4. On the Cycles tab page, click Create Notification. In the displayed dialog box, configure parameters. Table 1 describes the notification parameters.
                                                              Figure 1 Create a notification

                                                              -
                                                          Table 1 Notification parameters

                                                          Parameter

                                                          Mandatory

                                                          +

                                                          Mandatory

                                                          Description

                                                          +

                                                          Description

                                                          Notification Scope

                                                          +

                                                          Job Name

                                                          Yes

                                                          +

                                                          Yes

                                                          Notification scope. Available options include:

                                                          -
                                                          • One job: Notifications are sent for a single job.
                                                          • All jobs: Notifications are sent for all jobs.
                                                          +

                                                          Name of the job.

                                                          Job Name

                                                          +

                                                          Notification Type

                                                          Yes

                                                          +

                                                          Yes

                                                          Name of the job.

                                                          -

                                                          Notification Type

                                                          -

                                                          Yes

                                                          -

                                                          Type of the notification.

                                                          +

                                                          Type of the notification.

                                                          • When Notification Scope is One job, available options for this parameter include:
                                                            • Abnormal: When a job is not running properly or fails, a notification is sent to notify the user of the abnormality.
                                                              You can set Max. Notifications and Min. Notification Interval (min). After a job encounters an exception or fails and before it is recovered, you can send the interval for sending alarm notifications.
                                                              NOTE:

                                                              You can set Max. Notifications to a value from 1 to 50. If the default value 1 is used, Min. Notification Interval (min) is unavailable.

                                                              You can set Min. Notification Interval (min) to a value from 5 to 60.

                                                              -
                                                            • Successful: When a job runs successfully, a notification is sent to notify the user of the success.
                                                            • Uncompleted: This function supports only the jobs scheduled by day. If the job execution time is later than the configured time by which the job has not finished, a notification is sent.
                                                            • Cancellation: When a job is canceled, a notification is sent.
                                                              NOTE:

                                                              An alarm notification is sent when a job being scheduled or a running job instance is manually stopped.

                                                              +
                                                            • Successful: When a job runs successfully, a notification is sent to notify the user of the success.
                                                            • Uncompleted: This function supports only the jobs scheduled by day. If the job execution time is later than the configured time by which the job has not finished, a notification is sent.
                                                            • Cancellation: When a job is canceled, a notification is sent.
                                                              NOTE:

                                                              An alarm notification is sent when a job being scheduled or a running job instance is manually stopped.

                                                              If a user except the job executor cancels a job, a job cancellation alarm notification is sent.

                                                            • Successful rerun of a failed job
                                                              NOTE:

                                                              A notification will be sent after the successful rerun of a failed job only when a failure alarm was sent when the job failed.

                                                            • Job modification

                                                              A notification is sent when a job is modified or deleted, or the script used by the job is modified or deleted by a user except the job owner. If the job owner is empty, no alarm notification will be sent if the job is modified.

                                                            • Busy resources: If the DLI resource queue is busy during job execution, the job execution takes a long time or fails. As a result, an alarm is generated and a notification is sent.
                                                            -
                                                          • When Notification Scope is All jobs, available options for this parameter include:
                                                            • Abnormal: When a job is not running properly or fails, a notification is sent to notify the user of the abnormality.
                                                              You can set Max. Notifications and Min. Notification Interval (min). After a job encounters an exception or fails and before it is recovered, you can send the interval for sending alarm notifications.
                                                              NOTE:

                                                              You can set Max. Notifications to a value from 1 to 50. If the default value 1 is used, Min. Notification Interval (min) is unavailable.

                                                              -

                                                              You can set Min. Notification Interval (min) to a value from 5 to 60.

                                                              -
                                                              -
                                                              -
                                                            • Cancellation: When a job is canceled, a notification is sent.
                                                              NOTE:

                                                              An alarm notification is sent when a job being scheduled or a running job instance is manually stopped.

                                                              -

                                                              If a user except the job executor cancels a job, a job cancellation alarm notification is sent.

                                                              -
                                                              -
                                                            • Successful rerun of a failed job
                                                              NOTE:

                                                              A notification will be sent after the successful rerun of a failed job only when a failure alarm was sent when the job failed.

                                                              -
                                                              -
                                                            • Job modification

                                                              A notification is sent when a job is modified or deleted, or the script used by the job is modified or deleted by a user except the job owner. If the job owner is empty, no alarm notification will be sent if the job is modified.

                                                              -
                                                            • Busy resources: If the DLI resource queue is busy during job execution, the job execution takes a long time or fails. As a result, an alarm is generated and a notification is sent.
                                                          NOTE:
                                                          • For a real-time job, a notification is allowed to be sent only when the real-time job is in the Run abnormally or Failed state. For a batch job, a notification can be sent no matter when the batch job is in the Run normally, Run abnormally, or Failed state.
                                                          • If you choose the default DLI resource queue, you may not be able to obtain the resources needed to perform operations because the queue is busy and other users may preempt resources. If this occurs, you may try again during off-peak hours or create a queue to run your workloads.
                                                          • When a PatchData or test job is successfully executed, no notification is sent to avoid email or SMS bombing. In addition, no notification is sent when a PatchData job instance is recovered.
                                                          • If a job is re-executed and succeeds after it fails, a job instance recovery notification is sent.

                                                          Notification Mode

                                                          +

                                                          Topic Name

                                                          Yes

                                                          +

                                                          Yes

                                                          • By topic
                                                          • By owner
                                                          -

                                                          Topic Name

                                                          -

                                                          Yes

                                                          -

                                                          This parameter is mandatory only when Notification Mode is set to By topic.

                                                          -

                                                          Select a notification topic.

                                                          +

                                                          Select a notification topic.

                                                          Click View Topic to go to the SMN page and view topics.

                                                          NOTE:

                                                          Currently, only SMS, email, or HTTP are supported to subscribe to topics.

                                                          Terminal Protocol

                                                          +

                                                          Notification

                                                          Yes

                                                          +

                                                          Yes

                                                          Before setting this parameter, ensure that a job alarm notification topic has been configured in the workspace default configuration.

                                                          -

                                                          This parameter is mandatory only when Notification Mode is set to By owner.

                                                          -
                                                          • SMS
                                                          • Email
                                                          • Phone

                                                            Click Verify Contact Information to check for the jobs for which no owner information is set.

                                                            -

                                                            Click View Subscription. The Terminal Subscriptions page is displayed, on which you can view the terminal subscriptions that have been configured.

                                                            -
                                                          -

                                                          Cc

                                                          -

                                                          Yes

                                                          -

                                                          This parameter is mandatory only when Notification Mode is set to By owner.

                                                          -

                                                          You can select up to 10 options.

                                                          -

                                                          Notification

                                                          -

                                                          Yes

                                                          -

                                                          Whether to enable the notification function. The function is enabled by default.

                                                          +

                                                          Whether to enable the notification function. The function is enabled by default.

                                                          - @@ -67,7 +67,7 @@ + + + +
                                                          Table 1 Notification parameters

                                                          Parameter

                                                          +
                                                          - - - - - - - - - - - - - - - - - - - - - - - @@ -80,7 +80,14 @@
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0516.html b/docs/dataartsstudio/umn/dataartsstudio_01_0516.html index c4194366e..f42475235 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0516.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0516.html @@ -3,11 +3,11 @@

                                                          Managing Backups

                                                          You can back up all jobs, scripts, resources, and environment variables at a specified interval.

                                                          You can also restore assets that have been backed up, including jobs, scripts, resources, and environment variables.

                                                          -

                                                          Constraints

                                                          This function depends on OBS.

                                                          +

                                                          Constraints

                                                          • This function depends on OBS.
                                                          • Backup files cannot be automatically aged. You need to manually delete backup files on a regular basis.

                                                          Prerequisites

                                                          OBS has been enabled and a folder has been created in OBS.

                                                          -

                                                          Backing Up Assets

                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the navigation tree on the left, choose Manage Backup.

                                                            +

                                                            Backing Up Assets

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            3. In the navigation tree on the left, choose Manage Backup.

                                                            4. Click Start Daily Backup. In the Browse OBS File dialog box, select an OBS folder.

                                                              • Daily Backup starts at 00:00 every day to back up all jobs, scripts, resources, and environment variables of the previous day. The jobs, scripts, resources, and environment variables of the previous day are not backed up on the current day.
                                                              • If you select only the bucket name as the OBS storage path, the backup object is automatically stored in the folder named after the backup date. Environment variables, resources, scripts, and jobs are stored in the 1_env, 2_resources, 3_scripts, and 4_jobs folders, respectively.
                                                              • After the backup is successful, the backup.json file is automatically generated in the folder named after the backup date. The file stores job information based on the node type and can be modified before job restoration.
                                                              • To stop daily backup, click Stop Daily Backup.
                                                              @@ -16,7 +16,7 @@

                                                              Restoring Assets

                                                              1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              2. In the navigation tree of the DataArts Factory console, choose Manage Backup.
                                                              3. On the Manage Restoration tab, click Restore Backup.

                                                                In the Restore Backup dialog box, select the storage path of the asset to be restored from the OBS bucket and set the duplicate name policy.

                                                                • The storage path is the file path generated in Backing Up Assets.
                                                                • Before restoring assets, you can modify the backup.json file in the backup path. You can change the connection name (connectionName), database name (database), and cluster name (clusterName).
                                                                -
                                                                Figure 1 Restoring assets
                                                                +
                                                                Figure 1 Restoring assets

                                                              4. Click OK.
                                                              @@ -27,3 +27,10 @@
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0519.html b/docs/dataartsstudio/umn/dataartsstudio_01_0519.html index 35a053c2b..1bb41f4e6 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0519.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0519.html @@ -6,21 +6,21 @@

                                                          Constraints

                                                          This function depends on OBS or MRS HDFS.

                                                          (Optional) Creating a Directory

                                                          If a directory exists, you do not need to create one.

                                                          -
                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the left navigation pane, choose Configuration > Manage Resource.
                                                          3. In the directory list, click . In the displayed dialog box, configure directory parameters. Table 1 describes the directory parameters. -
                                                          Table 1 Notification parameters

                                                          Parameter

                                                          Mandatory

                                                          +

                                                          Mandatory

                                                          Description

                                                          +

                                                          Description

                                                          Notification Name

                                                          +

                                                          Notification Name

                                                          Yes

                                                          +

                                                          Yes

                                                          Name of the notification to be sent.

                                                          +

                                                          Name of the notification to be sent.

                                                          Cycle

                                                          +

                                                          Cycle

                                                          Yes

                                                          +

                                                          Yes

                                                          Interval for sending notifications, which can be set to Daily, Weekly, or Monthly.

                                                          +

                                                          Interval for sending notifications, which can be set to Daily, Weekly, or Monthly.

                                                          NOTE:

                                                          When Cycle is set to Daily, Weekly, or Monthly, a notification is sent every day, week, or month, and the notification content comes from the data generated from the last 24 hours, seven days, or 30 days.

                                                          Select Time

                                                          +

                                                          Select Time

                                                          Yes

                                                          +

                                                          Yes

                                                          This parameter is mandatory when Cycle is set to Weekly or Monthly.

                                                          +

                                                          This parameter is mandatory when Cycle is set to Weekly or Monthly.

                                                          Time when the notification is sent.

                                                          • If Cycle is set to Weekly, the value can be any day or any several days from Monday to Sunday in a week.
                                                          • If Cycle is set to Monthly, the value can be any day or any several days from 1st to 31st in a month.

                                                          Start Time

                                                          +

                                                          Start Time

                                                          Yes

                                                          +

                                                          Yes

                                                          Point in time when the notification is sent. The value can be accurate to hour or minute.

                                                          +

                                                          Point in time when the notification is sent. The value can be accurate to hour or minute.

                                                          Topic Name

                                                          +

                                                          Topic Name

                                                          Yes

                                                          +

                                                          Yes

                                                          Notification topic

                                                          +

                                                          Notification topic

                                                          OBS Bucket

                                                          +

                                                          OBS Bucket

                                                          Yes

                                                          +

                                                          Yes

                                                          OBS bucket for storing notification records

                                                          +

                                                          OBS bucket for storing notification records

                                                          Notification

                                                          +

                                                          Notification

                                                          Yes

                                                          +

                                                          Yes

                                                          Whether to enable the notification function. The function is enabled by default.

                                                          +

                                                          Whether to enable the notification function. The function is enabled by default.

                                                          - + + + +
                                                          Table 1 Resource directory parameters

                                                          Parameter

                                                          +
                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          3. In the left navigation pane, choose Configuration > Manage Resource.
                                                          4. In the directory list, click . In the displayed dialog box, configure directory parameters. Table 1 describes the directory parameters. +
                                                            - - - - - @@ -29,65 +29,65 @@
                                                          5. Click OK.
                                                          6. Creating a Resource

                                                            You have enabled OBS before creating a resource.

                                                            -
                                                            1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            2. In the left navigation pane, choose Configuration > Manage Resource.
                                                            3. Click Create Resource. In the displayed dialog box, configure resource parameters. Table 2 describes the resource parameters. Click OK. -
                                                            Table 1 Resource directory parameters

                                                            Parameter

                                                            Description

                                                            +

                                                            Description

                                                            Directory Name

                                                            +

                                                            Directory Name

                                                            Name of the resource directory. The name must contain 1 to 32 characters, including only letters, numbers, underscores (_), and hyphens (-).

                                                            +

                                                            Name of the resource directory. The name must contain 1 to 32 characters, including only letters, numbers, underscores (_), and hyphens (-).

                                                            Select Directory

                                                            +

                                                            Select Directory

                                                            Parent directory of the resource directory. The parent directory is the root directory by default.

                                                            +

                                                            Parent directory of the resource directory. The parent directory is the root directory by default.

                                                            + + + +
                                                            Table 2 Resource management parameters

                                                            Parameter

                                                            +
                                                            1. In the left navigation pane, choose Configuration > Manage Resource.
                                                            2. Click Create Resource. In the displayed dialog box, configure resource parameters. Table 2 describes the resource parameters. Click OK. +
                                                              - - - - - - - - - - - - - - - - - - - - - - - @@ -96,22 +96,22 @@

                                                              Editing a Resource

                                                              After a resource is created, you can modify resource parameters.

                                                              -
                                                              1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              2. In the left navigation pane, choose Configuration > Manage Resource.
                                                              3. In the Operation column of the resource, click Edit. In the displayed dialog box, modify the resource parameters. For details, see Table 2.
                                                              4. Click OK.
                                                              +
                                                              1. In the left navigation pane, choose Configuration > Manage Resource.
                                                              2. In the Operation column of the resource, click Edit. In the displayed dialog box, modify the resource parameters. For details, see Table 2.
                                                              3. Click OK.

                                                              Deleting a Resource

                                                              You can delete resources that are no longer needed.

                                                              Before deleting a resource, ensure that it is not used by any jobs.

                                                              If you are trying to delete a resource that is being used by jobs, the Delete Resource dialog box is displayed. When you click OK, the Reference List dialog box is displayed, in which you can view the jobs that are using the resource and click View in the Operation column to go to the job details page.

                                                              -
                                                              1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              2. In the left navigation pane, choose Configuration > Manage Resource.
                                                              3. In the Operation column of the resource, click Delete. The Delete Resource dialog box is displayed.
                                                              4. Click Yes.
                                                              +
                                                              1. In the left navigation pane, choose Configuration > Manage Resource.
                                                              2. In the Operation column of the resource, click Delete. The Delete Resource dialog box is displayed.
                                                              3. Click Yes.

                                                              Importing a Resource

                                                              To import a resource, perform the following operations:

                                                              -
                                                              1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              2. In the left navigation pane, choose Configuration > Manage Resource.
                                                              3. In the resource directory, click and select Import Resource. The Import Resource dialog box is displayed.
                                                              4. Select the resource file that has been uploaded to OBS and click Next. After the import is complete, click Close.
                                                              +
                                                              1. In the left navigation pane, choose Configuration > Manage Resource.
                                                              2. In the resource directory, click and select Import Resource. The Import Resource dialog box is displayed.
                                                              3. Select the resource file that has been uploaded to OBS and click Next. After the import is complete, click Close.

                                                              Exporting a Resource

                                                              To export a resource, perform the following operations:

                                                              -
                                                              1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              2. In the left navigation pane, choose Configuration > Manage Resource.
                                                              3. In the resource directory, select a resource, click , and select Export Resource. The system starts downloading the resource to the local PC.
                                                              +
                                                              1. In the left navigation pane, choose Configuration > Manage Resource.
                                                              2. In the resource directory, select a resource, click , and select Export Resource. The system starts downloading the resource to the local PC.

                                                              Viewing Resource References

                                                              To view the references of a resource, perform the following operations:

                                                              -
                                                              1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              2. In the left navigation pane, choose Configuration > Manage Resource.
                                                              3. Right-click a resource in the list and select View Reference.
                                                              4. In the displayed Reference List dialog box, view the references of the resource.

                                                                +
                                                                1. In the left navigation pane, choose Configuration > Manage Resource.
                                                                2. Right-click a resource in the list and select View Reference.
                                                                3. In the displayed Reference List dialog box, view the references of the resource.

                                                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0521.html b/docs/dataartsstudio/umn/dataartsstudio_01_0521.html index 571b8b188..c66e28079 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0521.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0521.html @@ -9,15 +9,15 @@

                                                              Preparations

                                                              • Object Storage Service (OBS) has been enabled and a bucket, for example, obs://dlfexample, has been created for storing the JAR package of the Spark job.
                                                              • DLI has been enabled, and the Spark cluster spark_cluster has been created for providing physical resources required for the Spark job.

                                                              Obtaining Spark Job Code

                                                              The Spark job code used in this example comes from the maven repository that can be download from https://repo.maven.apache.org/maven2/org/apache/spark/spark-examples_2.10/1.1.1/spark-examples_2.10-1.1.1.jar. This Spark job is to calculate the approximate value of π.

                                                              -
                                                              1. After obtaining the JAR package of the Spark job codes, upload it to the OBS bucket. The save path is obs://dlfexample/spark-examples_2.10-1.1.1.jar.
                                                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              3. In the navigation tree on the left, choose Configuration > Manage Resource. Click Create Resource and create resource spark-example on DataArts Factory and associate it with the JAR package obtained in 1.

                                                                Figure 1 Creating a resource
                                                                +
                                                                1. After obtaining the JAR package of the Spark job codes, upload it to the OBS bucket. The save path is obs://dlfexample/spark-examples_2.10-1.1.1.jar.
                                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                3. In the navigation tree on the left, choose Configuration > Manage Resource. Click Create Resource and create resource spark-example on DataArts Factory and associate it with the JAR package obtained in 1.

                                                                  Figure 1 Creating a resource

                                                              Submitting a Spark Job

                                                              You need to create a job on DataArts Factory and submit the Spark job using the DLI Spark node of the job.

                                                              -
                                                              1. Create a job named job_DLI_Spark for the DataArts Factory module.

                                                                Figure 2 Creating a job
                                                                -

                                                              2. Go to the job development page, drag the DLI Spark node to the canvas, and click the node to configure node properties.

                                                                Figure 3 Configuring node properties
                                                                +
                                                                1. Create a job named job_DLI_Spark for the DataArts Factory module.

                                                                  Figure 2 Creating a job
                                                                  +

                                                                2. Go to the job development page, drag the DLI Spark node to the canvas, and click the node to configure node properties.

                                                                  Figure 3 Configuring node properties

                                                                  Description of key properties:

                                                                  • DLI Queue: Select a DLI queue.
                                                                  • Job Running Resource: Maximum CPU and memory resources that can be used when a DLI Spark node is running.
                                                                  • Major Job Class: major class of a DLI Spark node. In this example, the major class is org.apache.spark.examples.SparkPi.
                                                                  • Spark program resource package: Select the resources created in 3.
                                                                  -

                                                                3. After the job orchestration is complete, click to test the job.

                                                                  Figure 4 Job logs (for reference only)
                                                                  +

                                                                4. After the job orchestration is complete, click to test the job.

                                                                  Figure 4 Job logs (for reference only)

                                                                5. If no error is recorded in logs, save and submit the job.
                                                              @@ -27,3 +27,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0522.html b/docs/dataartsstudio/umn/dataartsstudio_01_0522.html index 3fe764eb8..472eb7ea6 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0522.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0522.html @@ -8,22 +8,21 @@
                                                            3. Cloud Data Migration (CDM) has been enabled. A CDM cluster has been created for providing an agent for communication between DataArts Factory and MRS.

                                                              Ensure that the VPC, subnet, and security group of the CDM cluster are the same as those of the MRS cluster so that the two clusters can communicate with each other.

                                                            4. -

                                                              Creating a Hive Data Connection

                                                              Before developing a Hive SQL script, you must create a data connection to MRS Hive on the Manage Data Connections page of Management Center. The data connection name is hive1009.

                                                              +

                                                              Creating a Hive Data Connection

                                                              Before developing a Hive SQL script, you must create a data connection to MRS Hive on the Manage Data Connections page of Management Center. The data connection name is hive1009. For how to create an MRS Hive connection, see MRS Hive Connection Parameters.

                                                              Description of key parameters:

                                                              • Cluster Name: Enter the name of the created MRS cluster.
                                                              • Agent: Select the created CDM cluster.

                                                              Developing a Hive SQL Script

                                                              Choose Development > Develop Script and create a Hive SQL script named hive_sql. Then enter SQL statements in the editor to fulfill business requirements.

                                                              -
                                                              Figure 1 Developing a script
                                                              +
                                                              Figure 1 Developing a script

                                                              Notes:

                                                              • The script development area in Figure 1 is a temporary debugging area. After you close the tab page, the development area will be cleared. You can click Submit to save and submit a script version.
                                                              • Data Connection: Connection created in Creating a Hive Data Connection.

                                                              Developing a Hive SQL Job

                                                              After the Hive SQL script is developed, build a periodically deducted job for the Hive SQL script so that the script can be executed periodically.

                                                              -
                                                              1. Create an empty DataArts Factory job named job_hive_sql.

                                                                Figure 2 Creating a job named job_hive_sql
                                                                -

                                                              2. Go to the job development page, drag the MRS Hive SQL node to the canvas, and click the node to configure node properties.

                                                                Figure 3 Configuring properties for an MRS Hive SQL node
                                                                +
                                                                1. Create an empty DataArts Factory job named job_hive_sql.

                                                                  Figure 2 Creating a job named job_hive_sql
                                                                  +

                                                                2. Go to the job development page, drag the MRS Hive SQL node to the canvas, and click the node to configure node properties.

                                                                  Figure 3 Configuring properties for an MRS Hive SQL node

                                                                  Description of key properties:

                                                                  -
                                                                  • SQL Script: Hive SQL script hive_sql that is developed in Developing a Hive SQL Script.
                                                                  • Data Connection: Data connection that is configured in the SQL script hive_sql is selected by default. The value can be changed.
                                                                  • Database: Database that is configured in the SQL script hive_sql and is selected by default. The value can be changed.
                                                                  • Node Name: Name of the SQL script hive_sql by default. The value can be changed.
                                                                  -

                                                                3. After configuring the job, click to test it.
                                                                4. If the job runs successfully, click the blank area on the canvas and configure the job scheduling policy on the scheduling configuration page on the right.

                                                                  Figure 4 Configuring the scheduling mode
                                                                  -

                                                                  +
                                                                  • Node Name: Name of the SQL script hive_sql by default. The value can be changed.
                                                                  • SQL Script: Hive SQL script hive_sql that is developed in Developing a Hive SQL Script.
                                                                  • Data Connection: Data connection that is configured in the SQL script hive_sql is selected by default. The value can be changed.
                                                                  • Database: Database that is configured in the SQL script hive_sql and is selected by default. The value can be changed.
                                                                  +

                                                                5. After configuring the job, click to test it.
                                                                6. If the job runs successfully, click the blank area on the canvas and configure the job scheduling policy on the scheduling configuration page on the right.

                                                                  Figure 4 Configuring the scheduling mode

                                                                  The job is executed at 02:00 every day from Jan 1, 2021 to Jan 25, 2021.

                                                                7. Click Submit and Execute. The job will be automatically executed every day.
                                                                @@ -35,3 +34,10 @@
                                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0524.html b/docs/dataartsstudio/umn/dataartsstudio_01_0524.html index 233a4d965..5cffc0b0d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0524.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0524.html @@ -7,7 +7,7 @@

                                                              Preparing the Environment

                                                              • Enable DWS and create a DWS cluster for running DWS SQL jobs.
                                                              • Enable a CDM incremental package. Create a CDM cluster.

                                                                Ensure that the VPC, subnet, and security group of the CDM cluster are the same as those of the DWS cluster so that the two clusters can communicate with each other.

                                                              -

                                                              Creating a DWS Data Connection

                                                              Before developing a DWS SQL job, you must create a data connection to DWS on the Manage Data Connections page of Management Center. The data connection name is dws_link.

                                                              +

                                                              Creating a DWS Data Connection

                                                              Before developing a DWS SQL job, you must create a data connection to DWS on the Manage Data Connections page of Management Center. The data connection name is dws_link. For how to create a DWS connections, see DWS Connection Parameters.

                                                              The key parameters are as follows:

                                                              • Cluster Name: Select the DWS cluster you have created when preparing the environment.
                                                              • Agent: Select the CDM cluster you have created when preparing the environment.
                                                              @@ -32,16 +32,16 @@ CREATE TABLE trade_report trade_total INTEGER(8) );

                                                              Developing a DWS SQL Script

                                                              Choose Development > Develop Script and create a DWS SQL script named dws_sql. Enter an SQL statement in the editor to collect the sales amount of the previous day.

                                                              -
                                                              Figure 1 Developing a script
                                                              +
                                                              Figure 1 Developing a script

                                                              Key notes:

                                                              • The script development area in Figure 1 is a temporary debugging area. After you close the script tab, the development area will be cleared. You can click Submit to save and submit a script version.
                                                              • Connection: Select the data connection created in Creating a DWS Data Connection.

                                                              Developing a DWS SQL Job

                                                              After developing the DWS SQL script, create a job for periodically executing the DWS SQL script.

                                                              -
                                                              1. Create a batch job named job_dws_sql.
                                                              2. Go to the job development page, drag the DWS SQL node to the canvas, and click the node to configure its properties.

                                                                Figure 2 Configuring properties for the DWS SQL node
                                                                +
                                                                1. Create a batch job named job_dws_sql.
                                                                2. Go to the job development page, drag the DWS SQL node to the canvas, and click the node to configure its properties.

                                                                  Figure 2 Configuring properties for the DWS SQL node

                                                                  Key properties:

                                                                  • SQL script: Associate with the dws_sql script developed in Developing a DWS SQL Script.
                                                                  • Data Connection: Select the data connection configured in the dws_sql script. The data connection can be changed.
                                                                  • Database: Select the database configured in the dws_sql script. The database can be changed.
                                                                  • Script Parameter: Obtain the value of yesterday using the following EL expression:
                                                                    #{Job.getYesterday("yyyy-MM-dd")}
                                                                  • Node Name: The name of the dws_sql script is displayed by default. The name can be changed.
                                                                  -

                                                                3. After configuring the job, click to test it.
                                                                4. If the test is successful, click the blank area on the canvas and then the Scheduling Setup tab on the right. On the displayed page, configure the scheduling policy.

                                                                  Figure 3 Configuring the scheduling policy
                                                                  +

                                                                5. After configuring the job, click to test it.
                                                                6. If the test is successful, click the blank area on the canvas and then the Scheduling Setup tab on the right. On the displayed page, configure the scheduling policy.

                                                                  Figure 3 Configuring the scheduling policy

                                                                  Parameter descriptions:

                                                                  From Aug 6 to Aug 31 in 2021, the job was executed once at 02:00 every day.

                                                                  @@ -54,3 +54,10 @@ CREATE TABLE trade_report
                                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0525.html b/docs/dataartsstudio/umn/dataartsstudio_01_0525.html index bdb824ad4..773a286f8 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0525.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0525.html @@ -36,13 +36,13 @@ if __name__ == "__main__": sc.stop()

                                                              The encoding format must be set to UTF-8. Otherwise, an error will occur during script execution.

                                                              -
                                                            5. Prepare the data file in.txt, which contains some English words.
                                                            6. +
                                                            7. Prepare the data file in.txt, which contains some English words.
                                                            8. Procedure

                                                              -
                                                              1. Upload the script and data file to the OBS bucket.

                                                                Figure 1 Uploading files to an OBS bucket
                                                                +
                                                                1. Upload the script and data file to the OBS bucket.

                                                                  Figure 1 Uploading files to an OBS bucket

                                                                  In this example, upload wordcount.py and in.txt to obs://obs-tongji/python/.

                                                                  -

                                                                2. Create an empty job named job_MRS_Spark_Python.

                                                                  Figure 2 Creating a job
                                                                  -

                                                                3. Go to the job development page, drag the MRS Spark Python node to the canvas, and click the node to configure its properties.

                                                                  Figure 3 Configuring properties for an MRS Spark Python node
                                                                  +

                                                                4. Create an empty job named job_MRS_Spark_Python.

                                                                  Figure 2 Creating a job
                                                                  +

                                                                5. Go to the job development page, drag the MRS Spark Python node to the canvas, and click the node to configure its properties.

                                                                  Figure 3 Configuring properties for an MRS Spark Python node

                                                                  Parameter descriptions:

                                                                  --master
                                                                   yarn
                                                                  @@ -55,12 +55,11 @@ obs://obs-tongji/python/out

                                                                  obs://obs-tongji/python/wordcount.py is the directory where the script is stored.

                                                                  obs://obs-tongji/python/in.txt is the directory where the wordcount.py parameters are passed. You can pass the words to count.

                                                                  obs://obs-tongji/python/out is the directory where output parameters are stored. This directory will also be created in the OBS bucket automatically. If the out directory already exists in the OBS bucket, an error will occur.

                                                                  -

                                                                6. Click Test to execute the script job.
                                                                7. After the test is complete, click Submit.
                                                                8. Choose Monitor Job in the navigation pane and view the job execution result.

                                                                  Figure 4 Viewing the job execution result
                                                                  +

                                                                9. Click Test to execute the script job.
                                                                10. After the test is complete, click Submit.
                                                                11. Choose Monitor Job in the navigation pane and view the job execution result.

                                                                  Figure 4 Viewing the job execution result

                                                                  The job log shows that the job was successfully executed.

                                                                  -
                                                                  Figure 5 Job run logs
                                                                  -
                                                                  Figure 6 Job execution status
                                                                  -

                                                                12. View the returned records in the OBS bucket. (Skip this step if the return function is not configured.)

                                                                  Figure 7 Viewing the returned records in the OBS bucket
                                                                  -

                                                                  +
                                                                  Figure 5 Job run logs
                                                                  +
                                                                  Figure 6 Job execution status
                                                                  +

                                                                13. View the returned records in the OBS bucket. (Skip this step if the return function is not configured.)

                                                                  Figure 7 Viewing the returned records in the OBS bucket

                                                                Case 2: Using an MRS Spark Python Job to Print hello python

                                                                Prerequisites

                                                                You have the permission to access OBS paths.

                                                                @@ -79,9 +78,9 @@ yarn cluster obs://obs-tongji/python/zt_test_sparkPython1.py

                                                                zt_test_sparkPython1.py indicates the directory where the script is stored.

                                                                -

                                                              2. Click Test to execute the script job.
                                                              3. After the test is complete, click Submit.
                                                              4. Choose Monitor Job in the navigation pane and view the job execution result.

                                                                Figure 8 Viewing the job execution result
                                                                +

                                                              5. Click Test to execute the script job.
                                                              6. After the test is complete, click Submit.
                                                              7. Choose Monitor Job in the navigation pane and view the job execution result.

                                                                Figure 8 Viewing the job execution result

                                                              8. Verify the log.

                                                                Log in to MRS Manager and check that the log on YARN contains hello python.

                                                                -
                                                                Figure 9 Viewing logs on YARN
                                                                +
                                                                Figure 9 Viewing logs on YARN

                                                              @@ -91,3 +90,10 @@ obs://obs-tongji/python/zt_test_sparkPython1.py + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0528.html b/docs/dataartsstudio/umn/dataartsstudio_01_0528.html new file mode 100644 index 000000000..ed7887a11 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0528.html @@ -0,0 +1,209 @@ + + +

                                                              MRS ClickHouse

                                                              +

                                                              Functions

                                                              The MRS ClickHouse node is used to execute the ClickHouse SQL script predefined in DataArts Factory.

                                                              +
                                                              +

                                                              Parameters

                                                              Table 1, Table 2, and Table 3 describe the parameters of the MRS ClickHouse node.

                                                              + +
                                                              Table 2 Resource management parameters

                                                              Parameter

                                                              Mandatory

                                                              +

                                                              Mandatory

                                                              Description

                                                              +

                                                              Description

                                                              Name

                                                              +

                                                              Name

                                                              Yes

                                                              +

                                                              Yes

                                                              Name of the resource. The name must contain 1 to 32, including only letters, numbers, underscores (_), and hyphens (-).

                                                              +

                                                              Name of the resource. The name must contain 1 to 32, including only letters, numbers, underscores (_), and hyphens (-).

                                                              Type

                                                              +

                                                              Type

                                                              Yes

                                                              +

                                                              Yes

                                                              File type of the resource. Possible values:

                                                              +

                                                              File type of the resource. Possible values:

                                                              • jar: JAR file
                                                              • pyFile: User Python file
                                                              • file: User file
                                                              • archive: User AI model file The supported file name extensions are zip, tgz, tar.gz, tar, and jar.

                                                              Resource Location

                                                              +

                                                              Resource Location

                                                              Yes

                                                              +

                                                              Yes

                                                              Location of the resource. OBS and HDFS are supported. HDFS supports only MRS Spark, MRS Flink Job and MRS MapReduce nodes.

                                                              +

                                                              Location of the resource. OBS and HDFS are supported. HDFS supports only MRS Spark, MRS Flink Job and MRS MapReduce nodes.

                                                              File Path

                                                              +

                                                              File Path

                                                              Yes

                                                              +

                                                              Yes

                                                              Select an OBS file path when Resource Location is set to OBS.

                                                              +

                                                              Select an OBS file path when Resource Location is set to OBS.

                                                              Select an MRS cluster name when Resource Location is set to HDFS.

                                                              Depended Package

                                                              +

                                                              Depended Package

                                                              No

                                                              +

                                                              No

                                                              This parameter is available only for DLI Spark nodes.

                                                              +

                                                              This parameter is available only for DLI Spark nodes.

                                                              Depended JAR package that has been uploaded to OBS. This parameter is required when Type is set to jar or pyFile.

                                                              Select Directory

                                                              +

                                                              Select Directory

                                                              Yes

                                                              +

                                                              Yes

                                                              Directory to which the resource belongs. The root directory is selected by default.

                                                              +

                                                              Directory to which the resource belongs. The root directory is selected by default.

                                                              Description

                                                              +

                                                              Description

                                                              No

                                                              +

                                                              No

                                                              Descriptive information about the resource.

                                                              +

                                                              Descriptive information about the resource.

                                                              + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                              Table 1 Parameters of MRS ClickHouse nodes

                                                              Parameter

                                                              +

                                                              Mandatory

                                                              +

                                                              Description

                                                              +

                                                              Node Name

                                                              +

                                                              Yes

                                                              +

                                                              Name of a node. The name must contain 1 to 128 characters, including only letters, numbers, underscores (_), hyphens (-), slashes (/), less-than signs (<), and greater-than signs (>).

                                                              +

                                                              By default, the node name is the same as that of the selected script. If you want the node name to be different from the script name, disable this function by referring to Disabling Auto Node Name Change.

                                                              +

                                                              SQL Script

                                                              +

                                                              Yes

                                                              +

                                                              Path of a script to be executed. If no script is available, create and develop a script by referring to Creating a Script and Developing an SQL Script.

                                                              +

                                                              Script Parameter

                                                              +

                                                              No

                                                              +

                                                              If the associated SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                              +

                                                              If the parameters of the associated SQL script are changed, click to refresh the parameters.

                                                              +

                                                              Data Connection

                                                              +

                                                              Yes

                                                              +

                                                              Data connection that is configured in the SQL script. The value can be changed.

                                                              +

                                                              Database

                                                              +

                                                              Yes

                                                              +

                                                              Database that is configured in the SQL script. The value can be changed.

                                                              +

                                                              Program Parameter

                                                              +

                                                              No

                                                              +

                                                              Used to configure optimization parameters such as threads, memory, and vCPUs for the job to optimize resource usage and improve job execution performance.

                                                              +
                                                              NOTE:

                                                              This parameter is mandatory if the cluster version is MRS 1.8.7 or later than MRS 2.0.1.

                                                              +
                                                              +
                                                              +
                                                              + +
                                                              + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                              Table 2 Advanced parameters

                                                              Parameter

                                                              +

                                                              Mandatory

                                                              +

                                                              Description

                                                              +

                                                              Node Status Polling Interval (s)

                                                              +

                                                              Yes

                                                              +

                                                              How often the system check completeness of the node. The value ranges from 1 to 60 seconds.

                                                              +

                                                              Max. Node Execution Duration

                                                              +

                                                              Yes

                                                              +

                                                              Execution timeout interval for the node. If retry is configured and the execution is not complete within the timeout interval, the node will be executed again.

                                                              +

                                                              Retry upon Failure

                                                              +

                                                              Yes

                                                              +

                                                              Whether to re-execute a node if it fails to be executed. Possible values:

                                                              +
                                                              • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                • Retry upon Timeout
                                                                • Maximum Retries
                                                                • Retry Interval (seconds)
                                                                +
                                                              • No: The node will not be re-executed. This is the default setting.
                                                                NOTE:

                                                                If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                                +

                                                                If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                                +

                                                                Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                                +
                                                                +
                                                              +

                                                              Policy for Handling Subsequent Nodes If the Current Node Fails

                                                              +

                                                              Yes

                                                              +

                                                              Operation that will be performed if the node fails to be executed. Possible values:

                                                              +
                                                              • Suspend execution plans of the subsequent nodes: stops running subsequent nodes. The job instance status is Failed.
                                                              • End the current job execution plan: stops running the current job. The job instance status is Failed.
                                                              • Go to the next node: ignores the execution failure of the current node. The job instance status is Failure ignored.
                                                              • Suspend the current job execution plan: If the current job instance is in abnormal state, the subsequent nodes of this node and the subsequent job instances that depend on the current job are in waiting state.
                                                              +

                                                              Enable Dry Run

                                                              +

                                                              No

                                                              +

                                                              If you select this option, the node will not be executed, and a success message will be returned.

                                                              +

                                                              Task Groups

                                                              +

                                                              No

                                                              +

                                                              Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                              +
                                                              +
                                                              + +
                                                              + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                              Table 3 Lineage

                                                              Parameter

                                                              +

                                                              Description

                                                              +

                                                              Input

                                                              +

                                                              Add

                                                              +

                                                              Click Add. In the Type drop-down list, select the type to be created. The value can be DWS, OBS, CSS, HIVE, DLI, or CUSTOM.

                                                              +

                                                              OK

                                                              +

                                                              Click OK to save the parameter settings.

                                                              +

                                                              Cancel

                                                              +

                                                              Click Cancel to cancel the parameter settings.

                                                              +

                                                              Modify

                                                              +

                                                              Click to modify the parameter settings. After the modification, save the settings.

                                                              +

                                                              Delete

                                                              +

                                                              Click to delete the parameter settings.

                                                              +

                                                              View Details

                                                              +

                                                              Click to view details about the table created based on the input lineage.

                                                              +

                                                              Output

                                                              +

                                                              Add

                                                              +

                                                              Click Add. In the Type drop-down list, select the type to be created. The value can be DWS, OBS, CSS, HIVE, DLI, or CUSTOM.

                                                              +

                                                              OK

                                                              +

                                                              Click OK to save the parameter settings.

                                                              +

                                                              Cancel

                                                              +

                                                              Click Cancel to cancel the parameter settings.

                                                              +

                                                              Modify

                                                              +

                                                              Click to modify the parameter settings. After the modification, save the settings.

                                                              +

                                                              Delete

                                                              +

                                                              Click to delete the parameter settings.

                                                              +

                                                              View Details

                                                              +

                                                              Click to view details about the table created based on the output lineage.

                                                              +
                                                              +
                                                              + + +
                                                              + +
                                                              + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0529.html b/docs/dataartsstudio/umn/dataartsstudio_01_0529.html index be288f1cf..653aa9bd4 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0529.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0529.html @@ -2,16 +2,16 @@

                                                              Developing a Python Job

                                                              This section describes how to develop and execute a Python job using DataArts Factory.

                                                              -

                                                              Preparing the Environment

                                                              • An ECS named ecs-dgc has been created.

                                                                In this example, the ECS uses the CentOS 8.0 64bit with ARM (40 GB) public image and the Python environment. You can log in to the ECS and run the python command to check the Python environment.

                                                                -

                                                                +

                                                                Preparing the Environment

                                                                • An ECS named ecs-dgc has been created.

                                                                  In this example, the ECS uses the CentOS 8.0 64bit with ARM (40 GB) public image and the Python environment. You can log in to the ECS and run the python command to check the Python environment.

                                                                  +

                                                                  -
                                                                • You have enabled the DataArts Migration incremental package and created a CDM cluster named cdm-dlfpyhthon. The cluster provides an agent for the DataArts Factory module to communicate with the ECS.
                                                                • Ensure that the ECS can communicate with the CDM cluster, which depends on the following conditions:
                                                                  • If the CDM cluster and the ECS are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                                  • If the CDM cluster and the ECS are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, the host where the data source is located can access the Internet, and the port has been enabled in the firewall rules.
                                                                  • The ECS and the CDM cluster belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                                  +
                                                                • You have enabled the DataArts Migration incremental package and created a CDM cluster named cdm-dlfpyhthon. The cluster provides an agent for the DataArts Factory module to communicate with the ECS.
                                                                • Ensure that the ECS can communicate with the CDM cluster, which depends on the following conditions:
                                                                  • If the CDM cluster and the ECS are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                                  • If the CDM cluster and the ECS are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, the host where the data source is located can access the Internet, and the port has been enabled in the firewall rules.
                                                                  • The ECS and the CDM cluster belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                                Constraints

                                                                • Python nodes support script parameters and job parameters.
                                                                • This section uses Python3 as an example.

                                                                Creating an ECS Data Connection

                                                                Before developing a Python script, you need to create a connection to the ECS.

                                                                -
                                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                                3. On the displayed Manage Data Connections page, click Create Data Connection.
                                                                4. Configure parameters by referring to Table 1 and create a data connection named ecs.

                                                                  +

                                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                  2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                                  3. On the displayed Manage Data Connections page, click Create Data Connection.
                                                                  4. Configure parameters by referring to Table 1 and create a data connection named ecs.

                                                                    - @@ -85,7 +84,9 @@ - @@ -148,7 +149,7 @@

                                                                  5. Click Test to test connectivity of the data connection. If the test fails, the data connection cannot be created.
                                                                  6. After the test is successful, click OK to create the data connection.
                                                                  7. -

                                                                    Developing a Python Script

                                                                    1. Choose DataArts Factory > Develop Script and create a Python script named python_test.
                                                                    2. Select a Python version and host connection, and set input parameters as needed.

                                                                      The parameters will be transferred to the Python script when the script is executed. The parameters are separated by spaces, for example, Microsoft Oracle. The parameters must be referenced by the Python script. Otherwise, the parameters are invalid.

                                                                      +

                                                                      Developing a Python Script

                                                                      1. Choose DataArts Factory > Develop Script and create a Python script named python_test.
                                                                      2. Select a Python version (for example, Python 3) and host connection, and set input parameters as needed.

                                                                        The parameters will be transferred to the Python script when the script is executed. The parameters are separated by spaces, for example, Microsoft Oracle. The parameters must be referenced by the Python script. Otherwise, the parameters are invalid.

                                                                      3. Edit Python statements in the editor.

                                                                        This example defines a string template for saving company information and uses the template to output information about different companies.
                                                                        import sys
                                                                         Company_Name1=sys.argv[1]
                                                                        @@ -161,18 +162,18 @@ print(context2)
                                                                        • The script development area in Figure 1 is a temporary debugging area. After you close the script tab, the development area will be cleared.
                                                                        • Connection: Select the data connection created in Creating an ECS Data Connection.
                                                                        -
                                                                        Figure 1 Editing the Python statements
                                                                        +
                                                                        Figure 1 Editing the Python statements

                                                                        -

                                                                      4. Click Save and then Submit.
                                                                      5. Click Execute to execute the Python statements.
                                                                      6. View the script execution result.

                                                                        Figure 2 Viewing the script execution result
                                                                        +

                                                                      7. Click Save and then Submit.
                                                                      8. Click Execute to execute the Python statements.
                                                                      9. View the script execution result.

                                                                        Figure 2 Viewing the script execution result

                                                                      -

                                                                      Referencing the Python Script in a Job

                                                                      1. Create a job.
                                                                      2. Select a Python node and configure the node properties.

                                                                        Select the created Python script and set the node parameters. Set Script Parameters.

                                                                        The parameters will be transferred to the Python statement when the statement is executed. The parameters are separated by spaces, for example, Microsoft Oracle. The parameters must be referenced by the Python statement. Otherwise, the parameters are invalid.

                                                                        +

                                                                        Referencing the Python Script in a Job

                                                                        1. Create a job.
                                                                        2. Select a Python node and configure the node properties.

                                                                          Select the created Python script and set the node parameters. Set Script Parameters.

                                                                          The parameters will be transferred to the Python statement when the statement is executed. The parameters are separated by spaces, for example, Microsoft Oracle. The parameters must be referenced by the Python statement. Otherwise, the parameters are invalid.

                                                                          -
                                                                          Figure 3 Configuring properties of the Python node
                                                                          +
                                                                          Figure 3 Configuring properties of the Python node

                                                                          -

                                                                        3. Click Test and view the job running result.

                                                                          Figure 4 Checking the job execution result
                                                                          +

                                                                        4. Click Test and view the job running result.

                                                                          Figure 4 Checking the job execution result

                                                                        5. Click Save. The job configuration is complete.
                                                                        6. Click Submit. After a version is submitted, the job can be scheduled.
                                                                        @@ -183,3 +184,10 @@ print(context2)
                                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0530.html b/docs/dataartsstudio/umn/dataartsstudio_01_0530.html index 5ac68ab18..a5f340478 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0530.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0530.html @@ -1,24 +1,31 @@

                                                                        (Optional) Changing the Job Log Storage Path

                                                                        -

                                                                        By default, job logs and DLI dirty data are stored in an OBS bucket named dlf-log-{project ID}. You can customize a log storage path. You can configure an OBS bucket globally based on the workspace.

                                                                        -

                                                                        Constraints

                                                                        • This function depends on the OBS service.
                                                                        • The OBS path is only supported for OBS buckets and not for parallel file systems.
                                                                        +

                                                                        By default, job logs and DLI dirty data are stored in an OBS bucket named dlf-log-{project ID}. You can customize a storage path for logs and one for DLI dirty data. You can also configure an OBS bucket globally based on the workspace.

                                                                        +

                                                                        Notes and Constraints

                                                                        • This function depends on the OBS service.
                                                                        • The OBS path is only supported for OBS buckets and not for parallel file systems.
                                                                        -

                                                                        Prerequisites

                                                                        You have changed your account to either of the following:
                                                                        • DARTS Administrator or Tenant Administrator
                                                                        • DARTS User, which is the workspace administrator
                                                                        +

                                                                        Prerequisites

                                                                        You are using either of the following accounts:
                                                                        • DARTS Administrator or Tenant Administrator
                                                                        • DARTS User, which is the administrator of the current workspace
                                                                        -

                                                                        Procedure

                                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                        2. On the Workspaces page, locate the target workspace and click Edit in the Operation column.

                                                                          Figure 1 Workspace Information dialog box
                                                                          -

                                                                          -

                                                                          -

                                                                        3. In the Workspace Information dialog box, click Select next to Job Log Path and Dirty Data Path to select the path for storing logs and DLI dirty data. You can select a specific directory.

                                                                          Figure 2 Changing the path for storing logs and DLI dirty data
                                                                          +

                                                                          Procedure

                                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                          2. On the Workspaces page, locate the target workspace and click Edit in the Operation column.

                                                                            Figure 1 Workspace Information dialog box
                                                                            +

                                                                            +

                                                                            +

                                                                          3. In the Workspace Information dialog box, click Select next to Job Log Path and Dirty Data Path and select a path.

                                                                            Figure 2 Changing the job log path and DLI dirty data path

                                                                            -

                                                                          4. Click OK.
                                                                          +

                                                                        4. Click OK.
                                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0532.html b/docs/dataartsstudio/umn/dataartsstudio_01_0532.html index 460061ea5..917d39bad 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0532.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0532.html @@ -2,7 +2,7 @@

                                                                        Managing Job Tags

                                                                        Job tags are used to label jobs of the same or similar purposes to facilitate job management and query. This section describes how to manage job tags, including adding, deleting, importing, and exporting tags.

                                                                        -

                                                                        Adding a Job Tag

                                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                        3. In the navigation pane, choose Configuration > Configure.
                                                                        4. Choose Job Tag.
                                                                        5. Click Add. In the displayed dialog box, enter a tag name and click OK.

                                                                          You can add a maximum of 100 job tags.

                                                                          +

                                                                          Adding a Job Tag

                                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                          3. In the navigation pane, choose Configuration > Configure.
                                                                          4. Choose Job Tag.
                                                                          5. Click Add. In the displayed dialog box, enter a tag name and click OK.

                                                                            You can add a maximum of 100 job tags.

                                                                          @@ -12,13 +12,13 @@

                                                                          Monitoring Jobs with a Specified Tag

                                                                          1. In the navigation pane, choose Configuration > Configure.
                                                                          2. Choose Job Tag.
                                                                          3. Locate a tag and click Monitor in the Operation column. The Monitor Job page is displayed, on which all the jobs with the tag are displayed.
                                                                          -

                                                                          Locking and Unlocking a Job Tag

                                                                          To perform these operations, you must have the DARTS Administrator, Tenant Administrator, or workspace administrator permission.

                                                                          +

                                                                          Locking and Unlocking a Job Tag

                                                                          To perform these operations, you must have the DARTS Administrator, Tenant Administrator, or workspace administrator permission.

                                                                          1. In the navigation pane, choose Configuration > Configure.
                                                                          2. Choose Job Tag.
                                                                          3. Locate a tag and click Lock or Unlock in the Operation column.

                                                                            • A locked job tag cannot be deleted.
                                                                            • Importing a locked tag will fail.
                                                                            • A locked tag cannot be added to or removed from a job.
                                                                            • Importing a job with a locked tag will fail.
                                                                            • When a job fails to be imported and a tag needs to be automatically generated, if the tag already exists and is locked, it will not be added to the job.

                                                                          -

                                                                          Importing Job Tags

                                                                          To perform this operation, you must have the DARTS Administrator, Tenant Administrator, or workspace administrator permission.

                                                                          +

                                                                          Importing Job Tags

                                                                          To perform these operations, you must have the Administrator, Tenant Administrator, or workspace administrator permission.

                                                                          1. In the navigation pane, choose Configuration > Configure.
                                                                          2. Choose Job Tag.
                                                                          3. Click Import Job Tag.
                                                                          4. In the displayed dialog box, set the following parameters:

                                                                            • File Location: Select Local or OBS.
                                                                            • Select File from Local/OBS: Select a local path or an OBS bucket path.
                                                                              • You are advised to obtain a file to import by exporting tags. The first row of the file is the tag name, and the first column is the job name. If a job has a specified tag, the value in the corresponding cell is 1. Otherwise, the value is 0. If a cell is empty, the system uses value 0 for the cell.
                                                                              • The maximum size of the file to be imported is 10 MB.
                                                                              • If the file to be imported contains two tags with the same name, and the ID of one tag is 0 and that of the other tag is 1, the system uses 1 as the tag ID.
                                                                              • If the file to be imported contains two jobs with the same name, the system identifies the job in the latter row and uses the tag ID in this row.
                                                                            • Mode: Select Append or Overwrite.
                                                                              • Append: The new tag will not overwrite the existing one.
                                                                              • Overwrite: The new tag will overwrite the existing one.
                                                                              @@ -27,7 +27,7 @@

                                                                          Exporting Job Tags

                                                                          1. In the navigation pane, choose Configuration > Configure.
                                                                          2. Choose Job Tag.
                                                                          3. Export tags.

                                                                            • To export all tags, click Export All Tags above the tag list.
                                                                            • To export some tags, select them and click Export Selected Tags above the tag list.

                                                                            The following figure shows the exported job tags.

                                                                            -
                                                                            Figure 1 Exporting job tags
                                                                            +
                                                                            Figure 1 Exporting job tags
                                                                            • In the exported file, the first row is the tag name, and the first column is the job name. If a job has a specified tag, the value in the corresponding cell is 1. Otherwise, the value is 0.
                                                                            • The first column displays names of all the jobs in the workspace, including real-time job nodes, For Each subjobs, and Subjob subjobs.

                                                                          @@ -39,3 +39,10 @@
                                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0535.html b/docs/dataartsstudio/umn/dataartsstudio_01_0535.html index 53a99ca98..356fe8c5c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0535.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0535.html @@ -90,7 +90,7 @@
                                                                    + + + +
                                                                    Table 1 Host Connection parameters

                                                                    Parameter

                                                                    Mandatory

                                                                    @@ -48,7 +48,6 @@

                                                                    Yes

                                                                    Select the modules for which this connection is available.

                                                                    -

                                                                    All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                                    Basic and Network Connectivity Configuration

                                                                    @@ -66,9 +65,9 @@

                                                                    Yes

                                                                    CDM cluster used as an agent.

                                                                    +

                                                                    CDM cluster used as an agent. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                                    NOTE:
                                                                    • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                      -
                                                                    • When scheduling shell or Python scripts, the agent accesses the ECS. If shell and Python scripts are scheduled frequently, the ECS adds the private IP address of the agent to the blocklist. To ensure normal job scheduling, you are advised to use the root user of the ECS to add the private IP address bound to the agent (CDM cluster) to the /etc/hosts.allow file.

                                                                      For details about how to obtain the private IP address of the CDM cluster, see Viewing Basic Cluster Information and Modifying Cluster Configurations.

                                                                      +
                                                                    • When scheduling shell or Python scripts, the agent accesses the ECS. If shell and Python scripts are scheduled frequently, the ECS adds the private IP address of the agent to the blocklist. To ensure normal job scheduling, you are advised to use the root user of the ECS to add the private IP address bound to the agent (CDM cluster) to the /etc/hosts.allow file.

                                                                      For details about how to obtain the private IP address of the CDM cluster, see Viewing and Modifying CDM Cluster Configurations.

                                                                    Yes

                                                                    KMS key used to encrypt and decrypt the authentication information for the data source

                                                                    +
                                                                    KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                    NOTE:
                                                                    • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                    • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                    +
                                                                    +

                                                                    Data Source Authentication and Other Function Configuration

                                                                    @@ -111,8 +112,8 @@

                                                                    Yes

                                                                    This parameter is available only when Login Mode is set to Key Pair.

                                                                    -

                                                                    If Key Pair is the login mode of the host, you need to obtain the private key file, upload it to OBS, and select an OBS path.

                                                                    -
                                                                    NOTE:

                                                                    The uploaded private key must match the public key configured on the host. For details, see "Passwords and Key Pairs" > "Key Pairs" > "Application Scenarios for Using Key Pairs" in Elastic Cloud Server User Guide.

                                                                    +

                                                                    If Key Pair is the login mode of the host, you need to obtain the private key file, upload it to OBS, and select an OBS path.

                                                                    +
                                                                    NOTE:

                                                                    The uploaded private key must match the public key configured on the host. For details, see "Passwords and Key Pairs" > "Key Pairs" > "Application Scenarios for Using Key Pairs" in Elastic Cloud Server User Guide.

                                                                    Yes

                                                                    Whether to re-execute a node if it fails to be executed. Possible values:

                                                                    -
                                                                    • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                      • Retry upon Timeout
                                                                      • Maximum Retries
                                                                      • Retry Interval (seconds)
                                                                      +
                                                                      • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                        • Retry upon Timeout
                                                                        • Maximum Retries
                                                                        • Retry Interval (seconds)
                                                                      • No: The node will not be re-executed. This is the default setting.
                                                                        NOTE:

                                                                        If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                                        If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                                        Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                                        @@ -113,6 +113,13 @@

                                                                    If you select this option, the node will not be executed, and a success message will be returned.

                                                                    Task Groups

                                                                    +

                                                                    No

                                                                    +

                                                                    Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                                    +
                                                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0536.html b/docs/dataartsstudio/umn/dataartsstudio_01_0536.html index 744b64408..aac487f35 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0536.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0536.html @@ -1,6 +1,6 @@ -

                                                                    DLI Flink Job

                                                                    +

                                                                    DLI Flink Job

                                                                    Function

                                                                    The DLI Flink Job node is used to create and start jobs or check whether DLI jobs are running to analyze streaming big data in real time.

                                                                    After a DLI Flink streaming job is submitted to DLI, if the job is in the running state, the node is successfully executed. If periodic scheduling is configured for the job, the system periodically checks whether the Flink job is still in the running state. If the Flink job is in the running state, the node is successfully executed.

                                                                    @@ -90,7 +90,7 @@

                                                            No

                                                            If the associated Flink SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                            -

                                                            If the parameters of the associated Flink SQL script are changed, click to refresh the parameters.

                                                            +

                                                            If the parameters of the associated Flink SQL script are changed, click to refresh the parameters.

                                                            UDF Jar

                                                            @@ -186,7 +186,7 @@

                                                            No

                                                            If the associated Flink SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                            -

                                                            If the parameters of the associated Flink SQL script are changed, click to refresh the parameters.

                                                            +

                                                            If the parameters of the associated Flink SQL script are changed, click to refresh the parameters.

                                                            UDF Jar

                                                            @@ -367,7 +367,7 @@

                                                            Yes

                                                            Whether to re-execute a node if it fails to be executed. Possible values:

                                                            -
                                                            • Yes: The node will be re-executed, and the following parameters must be configured:
                                                              • Retry upon Timeout
                                                              • Maximum Retries
                                                              • Retry Interval (seconds)
                                                              +
                                                              • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                • Retry upon Timeout
                                                                • Maximum Retries
                                                                • Retry Interval (seconds)
                                                              • No: The node will not be re-executed. This is the default setting.
                                                                NOTE:

                                                                If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                                If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                                Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                                @@ -390,6 +390,13 @@

                                                            If you select this option, the node will not be executed, and a success message will be returned.

                                                            Task Groups

                                                            +

                                                            No

                                                            +

                                                            Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                            +
                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0537.html b/docs/dataartsstudio/umn/dataartsstudio_01_0537.html index 3ed3a9614..cde672387 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0537.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0537.html @@ -24,7 +24,7 @@

                                                          Yes

                                                          Select a topic that has been created in MRS Kafka. The SDK or command line can be used to create a topic.

                                                          +

                                                          Select a topic that has been created in MRS Kafka. The SDK or command line can be used to create a topic. For details, see "Using Kafka from Scratch" in MapReduce Service (MRS) Usage Guide.

                                                          Node Name

                                                          @@ -58,7 +58,7 @@

                                                          Yes

                                                          Whether to re-execute a node if it fails to be executed. Possible values:

                                                          -
                                                          • Yes: The node will be re-executed, and the following parameters must be configured:
                                                            • Retry upon Timeout
                                                            • Maximum Retries
                                                            • Retry Interval (seconds)
                                                            +
                                                            • Yes: The node will be re-executed, and the following parameters must be configured:
                                                              • Retry upon Timeout
                                                              • Maximum Retries
                                                              • Retry Interval (seconds)
                                                            • No: The node will not be re-executed. This is the default setting.
                                                              NOTE:

                                                              If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                              If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                              Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                              @@ -81,6 +81,13 @@

                                                          If you select this option, the node will not be executed, and a success message will be returned.

                                                          Task Groups

                                                          +

                                                          No

                                                          +

                                                          Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                          +
                                                          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0538.html b/docs/dataartsstudio/umn/dataartsstudio_01_0538.html index bb9a7316f..d14936a0a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0538.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0538.html @@ -39,7 +39,7 @@

                                                          Yes

                                                          Text content sent to Kafka. You can directly enter text or click to use the EL expression.

                                                          +

                                                          Text content sent to Kafka. You can directly enter text or click to use the EL expression.

                                                          Yes

                                                          Whether to re-execute a node if it fails to be executed. Possible values:

                                                          -
                                                          • Yes: The node will be re-executed, and the following parameters must be configured:
                                                            • Retry upon Timeout
                                                            • Maximum Retries
                                                            • Retry Interval (seconds)
                                                            +
                                                            • Yes: The node will be re-executed, and the following parameters must be configured:
                                                              • Retry upon Timeout
                                                              • Maximum Retries
                                                              • Retry Interval (seconds)
                                                            • No: The node will not be re-executed. This is the default setting.
                                                              NOTE:

                                                              If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                              If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                              Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                              @@ -90,6 +90,13 @@

                                                          If you select this option, the node will not be executed, and a success message will be returned.

                                                          Task Groups

                                                          +

                                                          No

                                                          +

                                                          Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                          +
                                                          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0554.html b/docs/dataartsstudio/umn/dataartsstudio_01_0554.html index 1a638311c..9be19018c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0554.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0554.html @@ -42,7 +42,7 @@

                                                        This parameter is available when you select Flink SQL job for Job Type.

                                                        If the associated SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                        -

                                                        If the parameters of the associated SQL script are changed, click to refresh the parameters.

                                                        +

                                                        If the parameters of the associated SQL script are changed, click to refresh the parameters.

                                                        Process Type

                                                        @@ -58,8 +58,8 @@

                                                        Yes

                                                        Select the MRS cluster.

                                                        -
                                                        To create an MRS cluster, use either of the following methods:
                                                        • Click . On the Clusters page, create an MRS cluster.
                                                        • Go to the MRS console to create an MRS cluster.
                                                          NOTE:

                                                          Currently, MRS Flink jobs support MRS 3.2.0-LTS.1 and later versions.

                                                          +

                                                        Select an MRS cluster.

                                                        +
                                                        To create an MRS cluster, use either of the following methods:
                                                        • Click . On the Clusters page, create an MRS cluster.
                                                        • Go to the MRS console to create an MRS cluster.
                                                          NOTE:

                                                          Currently, MRS Flink jobs support MRS 3.2.0-LTS.1 and later versions.

                                                        @@ -69,7 +69,8 @@

                                                        Yes

                                                        Name of an MRS job. The name contains 1 to 64 characters, including only letters, digits, and underscores (_).

                                                        +

                                                        MRS job name. It can contain a maximum of 64 characters. Only letters, digits, hyphens (-), and underscores (_) are allowed.

                                                        +

                                                        The system can automatically enter a job name in Job name_Node name format.

                                                        NOTE:

                                                        The job name cannot contain Chinese characters or more than 64 characters. If the job name does not meet requirements, the MRS job will fail to be submitted.

                                                        No

                                                        Select a created MRS resource queue.

                                                        +

                                                        This parameter is mandatory if Whether MRS Resource Queue Is Mandatory is set to Yes.

                                                        NOTE:

                                                        Select a queue you configured in the queue permissions of DataArts Security. If you set multiple resource queues for this node, the resource queue you select here has the highest priority.

                                                        Used to configure optimization parameters such as threads, memory, and vCPUs for the job to optimize resource usage and improve job execution performance.

                                                        NOTE:

                                                        This parameter is mandatory if the cluster version is MRS 1.8.7 or later than MRS 2.0.1.

                                                        -

                                                        For details about the parameters of MRS Flink jobs, see Managing an Existing Cluster > Job Management > Running a Flink Job in MapReduce Service (MRS) User Guide.

                                                        +

                                                        For details about the parameters of MRS Flink jobs, see Managing an Existing Cluster > Job Management > Running a Flink Job in MapReduce Service (MRS) User Guide.

                                                        Input Data Path

                                                        @@ -145,7 +147,7 @@

                                                        Yes

                                                        Whether to re-execute a node if it fails to be executed. Possible values:

                                                        -
                                                        • Yes: The node will be re-executed, and the following parameters must be configured:
                                                          • Retry upon Timeout
                                                          • Maximum Retries
                                                          • Retry Interval (seconds)
                                                          +
                                                          • Yes: The node will be re-executed, and the following parameters must be configured:
                                                            • Retry upon Timeout
                                                            • Maximum Retries
                                                            • Retry Interval (seconds)
                                                          • No: The node will not be re-executed. This is the default setting.
                                                            NOTE:

                                                            If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                            If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                            Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                            @@ -168,6 +170,13 @@

                                                        If you select this option, the node will not be executed, and a success message will be returned.

                                                        Task Groups

                                                        +

                                                        No

                                                        +

                                                        Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                        +
                                                        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0555.html b/docs/dataartsstudio/umn/dataartsstudio_01_0555.html index 2789d231e..f447d2856 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0555.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0555.html @@ -9,38 +9,40 @@

                                                        Classification of Scheduling Identities

                                                        Scheduling identities are classified into agencies and IAM accounts.

                                                        • Agencies: Cloud services interwork with each other, and some cloud services are dependent on other services. You can create an agency to delegate cloud services to access other services and perform resource O&M on your behalf.
                                                          Agencies are classified into the following types:
                                                          -
                                                        • IAM accounts: You can configure IAM accounts through user groups in a unified manner and manage permissions in an easier way than agencies. IAM accounts also have better compatibility and support MRS nodes (MRS Presto SQL, MRS Spark, MRS Spark Python, MRS Flink Job, and MRS MapReduce), directly connected nodes (MRS Spark SQL and MRS Hive SQL), and ETL Job nodes whose destination is DWS, so IAM accounts can be used to submit jobs for some MRS clusters and ETL Job nodes that cannot be submitted through agencies.
                                                          IAM accounts are classified into the following types:
                                                          • Public IAM accounts: They apply to all jobs in the workspace. For details about how to configure a public IAM account, see Configuring a Public IAM Account.
                                                          • Execution users: They apply only to a single job. For details about how to configure an execution user, see Configuring an Executor.
                                                          +
                                                        • IAM accounts: You can configure IAM accounts through user groups in a unified manner and manage permissions in an easier way than agencies. IAM accounts also have better compatibility and support MRS nodes (MRS Presto SQL, MRS Spark, MRS Spark Python, MRS Flink Job, and MRS MapReduce), directly connected nodes (MRS Spark SQL and MRS Hive SQL), and ETL Job nodes whose destination is DWS, so IAM accounts can be used to submit jobs for some MRS clusters and ETL Job nodes that cannot be submitted through agencies.
                                                          IAM accounts are classified into the following types:
                                                          • Public IAM accounts: They apply to all jobs in the workspace. For details about how to configure a public IAM account, see Configuring a Public IAM Account.
                                                          • Execution users: They apply only to a single job. For details about how to configure an execution user, see Configuring an Executor.

                                                            You can configure execution users only after apply for the whitelist membership. To use this feature, contact customer service or technical support.

                                                            +
                                                            +

                                                        Priorities of Scheduling Identities

                                                        The system obtains permissions for the job agency, public agency, execution user, and public IAM account in sequence, and then executes jobs with the permissions.

                                                        By default, a job is executed by the user who starts the job. If a job is started by a user without the required permissions, the job fails to be executed due to insufficient permissions. You can configure a scheduling identity to resolve this issue.

                                                        -

                                                        Constraints

                                                        • To create or modify an agency, you must have the Security Administrator permissions.
                                                        • To configure a workspace-level scheduling identity, you must have the DARTS Administrator or Tenant Administrator policy.
                                                        • To configure a job-level agency, you must have the permission to view the list of agencies.
                                                        +

                                                        Constraints

                                                        • To create or modify an agency, you must have the Security Administrator permissions.
                                                        • To configure a workspace-level scheduling identity, you must have the DARTS Administrator or Tenant Administrator policy.
                                                        • To configure a job-level agency, you must have the permission to view the list of agencies.

                                                        Configuring a Public Agency

                                                        A public agency applies to all jobs in the workspace, especially those that contain MRS nodes. Exercise caution when performing this operation.

                                                        -
                                                        1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                        2. In the navigation pane, choose Configuration > Configure.
                                                        3. Choose Scheduling Identities and set Public Scheduling Identity to Public agency.
                                                        4. Click + to select an agency or create one. For how to create an agency and configure permissions, see Reference: Creating an Agency and Reference: Configuring Agency Permissions.
                                                          Figure 1 Configuring a workspace-level agency
                                                          -
                                                        5. Click OK to return to the Scheduling Identities page and click .

                                                          For a batch processing job, a public agency takes effect in the next cycle. For a real-time processing job, you must restart the job for a public agency to take effect.

                                                          +
                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          3. In the navigation pane, choose Configuration > Configure.
                                                          4. Choose Scheduling Identities and set Public Scheduling Identity to Public agency.
                                                          5. Click + to select an agency or create one. For how to create an agency and configure permissions, see Reference: Creating an Agency and Reference: Configuring Agency Permissions.
                                                            Figure 1 Configuring a workspace-level agency
                                                            +
                                                          6. Click OK to return to the Scheduling Identities page and click .

                                                            For a batch processing job, a public agency takes effect in the next cycle. For a real-time processing job, you must restart the job for a public agency to take effect.

                                                          Configuring a Job-Level Agency

                                                          You can create a job-level agency when creating a job. You can also modify the agency of an existing job.

                                                          Configuring an agency when creating a job

                                                          -
                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the navigation pane of the DataArts Factory homepage, choose Development > Develop Job.
                                                          3. Right-click the job directory and choose Create Job from the shortcut menu. The Create Job dialog box is displayed. If a workspace-level agency has been configured, it is used for the job by default. You can also select another agency from the agency list. For how to create an agency and configure permissions, see Reference: Creating an Agency and Reference: Configuring Agency Permissions.
                                                            Figure 2 Configuring an agency for a job
                                                            +
                                                            1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            2. In the navigation pane of the DataArts Factory homepage, choose Development > Develop Job.
                                                            3. Right-click the job directory and choose Create Job from the shortcut menu. The Create Job dialog box is displayed. If a workspace-level agency has been configured, it is used for the job by default. You can also select another agency from the agency list. For how to create an agency and configure permissions, see Reference: Creating an Agency and Reference: Configuring Agency Permissions.
                                                              Figure 2 Configuring an agency for a job

                                                              Modifying the agency of an existing job

                                                            1. In the navigation pane of the DataArts Factory homepage, choose Development > Develop Job.
                                                            2. In the job directory, double-click an existing job. On the far right of the displayed page, click Basic Info. The dialog box of the job's basic settings is displayed. If a workspace-level agency has been configured, it is used by default. You can also select another agency from the agency list.
                                                          -

                                                          Configuring a Public IAM Account

                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the navigation pane, choose Configuration > Configure.
                                                          3. Choose Scheduling Identities and set Public Scheduling Identity to Public IAM account.
                                                          4. Enter the public IAM account in the text box.
                                                          5. Click .
                                                          +

                                                          Configuring a Public IAM Account

                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the navigation pane, choose Configuration > Configure.
                                                          3. Choose Scheduling Identities and set Public Scheduling Identity to Public IAM account.
                                                          4. Enter the public IAM account in the text box.
                                                          5. Click .

                                                          Configuring an Executor

                                                          Configuring a Job Executor

                                                          1. In the job directory, double-click a job.
                                                          2. Click the Basic Info tab and set the executor for the job.

                                                          Reference: Creating an Agency

                                                          1. Log in to the IAM console.
                                                          2. In the navigation pane, choose Agencies and click Create Agency.
                                                          3. Enter an agency name, for example, DGC_agency.
                                                          4. On the displayed page, select Cloud service for Agency Type and Data Lake Governance Center (DGC) for Cloud Service. This grants operation permissions to DataArts Studio so that DataArts Studio can use cloud services and perform O&M for you.

                                                            -
                                                          5. Click Next.
                                                          6. On the Authorize Agency page, search for and select the Tenant Administrator policy. Then click Next.
                                                            • Users assigned the Tenant Administrator policy have all permissions on all services except on IAMIAM. Therefore, delegate the Tenant Administrator policy to DataArts Studio so that DataArts Studio can access all related services.
                                                            • If you want to meet the security control requirements for fewer permissions, you only need to configure the OBS OperateAccess permissions (During job execution, execution log information needs to be written to OBS. Therefore, you need to add the OBS OperateAccess permissions.) Then, configure different agency permissions based on the node type in the job. For example, if a job contains only the Import GES node, you can configure the GES Administrator and OBS OperateAccess permissions. For details, see Reference: Configuring Agency Permissions.
                                                              Figure 3 Assigning permissions
                                                              +
                                                            • Click Next.
                                                            • On the Authorize Agency page, search for and select the Tenant Administrator policy. Then click Next.
                                                              • Users assigned the Tenant Administrator policy have all permissions on all services except on IAMIAM. Therefore, delegate the Tenant Administrator policy to DataArts Studio so that DataArts Studio can access all related services.
                                                              • If you want to meet the security control requirements for fewer permissions, you only need to configure the OBS OperateAccess permissions (During job execution, execution log information needs to be written to OBS. Therefore, you need to add the OBS OperateAccess permissions.) Then, configure different agency permissions based on the node type in the job. For example, if a job contains only the Import GES node, you can configure the GES Administrator and OBS OperateAccess permissions. For details, see Reference: Configuring Agency Permissions.
                                                                Figure 3 Assigning permissions

                                                              @@ -66,7 +68,7 @@

                                                        CDM Job

                                                        DARTS Administrator

                                                        +

                                                        DARTS Administrator

                                                        All DataArts Studio permissions

                                                        MRS Spark SQL, MRS Hive SQL, MRS Kafka, and Kafka Client (connecting to the clusters in proxy mode)

                                                        DARTS Administrator

                                                        +

                                                        DARTS Administrator

                                                        KMS Administrator

                                                        DARTS Administrator has all permissions required for DataArts Studio.

                                                        +

                                                        DARTS Administrator has all permissions required for DataArts Studio.

                                                        Users assigned the KMS Administrator policy have the administrator permissions for encryption keys in DEW.

                                                        DWS SQL, RDS SQL (connecting to data sources in proxy mode), and Shell

                                                        DARTS Administrator

                                                        +

                                                        DARTS Administrator

                                                        KMS Administrator

                                                        DARTS Administrator has all permissions required for DataArts Studio.

                                                        +

                                                        DARTS Administrator has all permissions required for DataArts Studio.

                                                        Users assigned the KMS Administrator policy have the administrator permissions for encryption keys in DEW.

                                                        CSS

                                                        DARTS Administrator

                                                        +

                                                        DARTS Administrator

                                                        Elasticsearch Administrator

                                                        DARTS Administrator has all permissions required for DataArts Studio.

                                                        +

                                                        DARTS Administrator has all permissions required for DataArts Studio.

                                                        Users assigned the Elasticsearch Administrator policy have all permissions for CSS. This role depends on the Tenant Guest and Server Administrator roles in the same project.

                                                        -
                                                      31. Click OK. The system starts to run the PatchData task based on the configured scheduling period.
                                                      32. On the Monitor PatchData page, you can view the PatchData task status, date, number of parallel periods, PatchData job name, and stopped tasks. You can also view details about the PatchData task.

                                                        +
                                                      33. Click OK. The system starts to run the PatchData task based on the configured scheduling period.
                                                      34. On the Monitor PatchData page, you can view the PatchData task status, date, number of parallel periods, PatchData job name, and stopped tasks. You can also view logs of the PatchData task.
                                                        Figure 5 Querying PatchData details
                                                        +

                                                      35. Run the following SQL statement to check whether destination table B contains historical data of source table A:
                                                        SELECT * FROM B
                                                      @@ -117,3 +118,10 @@ INSERT INTO A VALUES ('2','45', '2022-02-27');
                                                    + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0586.html b/docs/dataartsstudio/umn/dataartsstudio_01_0586.html new file mode 100644 index 000000000..1ad9a5ea2 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0586.html @@ -0,0 +1,20 @@ + + +

                                                    Binding or Unbinding an EIP

                                                    +

                                                    Scenario

                                                    After creating a CDM cluster, you can bind an EIP to or unbind an EIP from the cluster.

                                                    +

                                                    If CDM needs to access a local or Internet data source, or a cloud service in another VPC, bind an EIP to the CDM cluster or use a NAT gateway to enable the CDM cluster to share the EIP with ECSs to access the Internet.

                                                    +

                                                    If SSL encryption is configured for the access channel of a local data source, CDM cannot connect to the data source using the EIP.

                                                    +
                                                    +
                                                    +

                                                    Prerequisites

                                                    • You have created a CDM cluster.
                                                    • Your EIP quota is sufficient.
                                                    +
                                                    +

                                                    Procedure

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                    2. Bind an EIP to or unbind an EIP from a cluster.

                                                      • Binding an EIP: In the Operation column, click Bind EIP. The Bind EIP dialog box is displayed.
                                                      • Unbinding an EIP: In the Operation column, choose More > Unbind EIP.
                                                      +

                                                    3. Click Yes.
                                                    +
                                                    +
                                                    + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0587.html b/docs/dataartsstudio/umn/dataartsstudio_01_0587.html new file mode 100644 index 000000000..abd5533b0 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0587.html @@ -0,0 +1,41 @@ + + +

                                                    Viewing and Modifying CDM Cluster Configurations

                                                    +

                                                    Scenario

                                                    After creating a CDM cluster, you can view its basic information and modify its configurations.

                                                    +
                                                    • You can view the following basic cluster information:
                                                      • Cluster Information: cluster version, creation time, project ID, instance ID, and cluster ID
                                                      • Instance Configuration: cluster flavor, CPU, and memory
                                                      • Network
                                                      +
                                                    • You can modify the following cluster configurations:
                                                      • Notification: If a CDM migration job (only table/file migration) fails or the EIP is abnormal, CDM sends an SMS or email notification to the user.
                                                      • User Isolation: determines whether other users can view and operate the migration jobs and links in the cluster.
                                                        • If this function is enabled, migration jobs and links in the cluster are isolated. Other IAM users of the a cloud platform account cannot view or operate the migration jobs and links in the cluster.

                                                          Starting jobs by group will run all jobs in the group. If user isolation is enabled, starting jobs by group will still run all jobs in the group even if otherIAM users in the a cloud platform account cannot view the jobs in the group. Therefore, you are not advised to start jobs by group in user isolation scenarios.

                                                          +
                                                          +
                                                        • If this function is disabled, migration jobs and links in the cluster can be shared with other users. All IAM users with the required permission in the a cloud platform account can view and operate migration jobs and links.

                                                          After disabling User Isolation, restart the cluster VM for the settings to take effect.

                                                          +
                                                        +
                                                      • Maximum Concurrent Extractors: This parameter specifies the total number of concurrent extractors of a job. If the total number of concurrent extractors of all jobs exceeds the upper limit, the excess extractors will wait in a queue.

                                                        The value of this parameter ranges from 1 to 1000. You are advised to set it based on the cluster specifications. For details about the recommended value, see Maximum Concurrent Extractors. If the number of concurrent extractors is too large, memory overflow may occur. Exercise caution when changing the value.

                                                        +

                                                        This parameter is also available on the Settings tab page. You can change its value either on this page or the Settings page.

                                                        +
                                                        +
                                                      +
                                                    +
                                                    +

                                                    Prerequisites

                                                    You have created a CDM cluster.

                                                    +
                                                    +

                                                    Viewing Basic Cluster Information

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                    2. Click the cluster name to view its basic information.

                                                      +

                                                      +

                                                    +
                                                    +

                                                    Modifying Cluster Configurations

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console. On the DataArts Studio console, locate a workspace and click DataArts Migration to access the CDM console.
                                                    1. Click the name of a cluster and click the Cluster Configuration tab to modify Notification, User Isolation and Maximum Concurrent Extractors.

                                                      +

                                                      +

                                                    2. Click Save. The Cluster Management page is displayed.
                                                    3. If User Isolation is disabled, choose More > Restart in the Operation column to restart the cluster VM for the settings to take effect.

                                                      Figure 1 Restarting a cluster
                                                      +
                                                      • Restart CDM service process: Only the CDM service process is restarted. The cluster VM will not be restarted.
                                                      • VM restart: The service process will be interrupted and VMs in the cluster will be restarted.
                                                      +

                                                    4. Select VM restart and click Yes.
                                                    +
                                                    +
                                                    + + + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0589.html b/docs/dataartsstudio/umn/dataartsstudio_01_0589.html new file mode 100644 index 000000000..23471f377 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0589.html @@ -0,0 +1,23 @@ + + +

                                                    Migration in Transaction Mode

                                                    +

                                                    When a CDM job fails to be executed, CDM rolls back the data to the state before the job starts and automatically deletes data from the destination table.

                                                    +
                                                    • Parameter position: When creating a table/file migration job, if the migration source is a relational database, set Import to Staging Table in the advanced attributes of Destination Job Configuration to determine whether to enable the transaction mode.
                                                    • Parameter principle: If you set this parameter to Yes, CDM automatically creates a temporary table and imports the data to the temporary table. After the data is imported successfully, CDM migrates the data to the destination table in transaction mode of the database. If the import fails, the destination table is rolled back to the state before the job starts.
                                                      Figure 1 Migration in transaction mode
                                                      +

                                                      +
                                                    +

                                                    If you select Clear part of data or Clear all data for Clear Data Before Import, CDM does not roll back the deleted data in transaction mode.

                                                    +
                                                    +
                                                    +
                                                    + +
                                                    + + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0590.html b/docs/dataartsstudio/umn/dataartsstudio_01_0590.html new file mode 100644 index 000000000..d1dd6f84c --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0590.html @@ -0,0 +1,32 @@ + + +

                                                    Encryption and Decryption During File Migration

                                                    +
                                                    When you migrate files to a file system, CDM can encrypt and decrypt those files. Currently, CDM supports the following encryption modes: +
                                                    +

                                                    AES-256-GCM

                                                    Currently, only AES-256-GCM (NoPadding) is supported. This algorithm is used for encryption at the migration destination and decryption at the migration source. The supported source and destination data sources are as follows:

                                                    +
                                                    • Data sources supported by the migration source: HDFS (supported in the binary format)
                                                    • Data sources supported by the migration destination: HDFS (supported in the binary format)
                                                    +

                                                    The following part describes how to use AES-256-GCM to decrypt the encrypted files to be exported from HDFS and encrypt the files to be imported to HDFS.

                                                    +
                                                    • Configure decryption at the migration source.
                                                      When you use CDM to create a job for exporting files from HDFS, set the migration source to HDFS and file format to binary, and set the following parameters in the advanced settings of Source Job Configuration:
                                                      1. Encryption: Select AES-256-GCM.
                                                      2. DEK: The key must be the same as that configured in encryption. Otherwise, the decrypted data is incorrect and the system does not display an error message.
                                                      3. IV: The initialization vector must be the same as that configured in encryption. Otherwise, the decrypted data is incorrect and the system does not display an error message.
                                                      +
                                                      +

                                                      In this way, after CDM exports encrypted files from HDFS, the files written to the migration destination are decrypted plaintext files.

                                                      +
                                                    +
                                                    • Configure encryption at the migration destination.
                                                      When you create a CDM job to import files to HDFS, set the migration destination to HDFS and file format to binary, and set the following parameters in the advanced settings of Destination Job Configuration:
                                                      1. Encryption: Select AES-256-GCM.
                                                      2. DEK: custom encryption key. The key consists of 64 hexadecimal numbers. It is case-insensitive but must contain 64 characters. For example, DD0AE00DFECD78BF051BCFDA25BD4E320DB0A7AC75A1F3FC3D3C56A457DCDC1B.
                                                      3. IV: custom initialization vector. The initialization vector consists of 32 hexadecimal numbers. It is case-insensitive but must contain 32 characters. For example, 5C91687BA886EDCD12ACBC3FF19A3C3F.
                                                      +
                                                      +

                                                      In this way, after CDM imports files to HDFS, the files in the destination HDFS are encrypted using the AES-256-GCM algorithm.

                                                      +
                                                    +
                                                    +

                                                    KMS Encryption

                                                    The migration source does not support KMS encryption.

                                                    +
                                                    +

                                                    CDM supports KMS encryption if tables, files, or a whole database is migrated to OBS. In the Advanced Attributes area of the Destination Job Configuration page, set the parameters.

                                                    +

                                                    A key must be created in KMS of DEW in advance. For details, see the Data Encryption Workshop User Guide.

                                                    +

                                                    After KMS encryption is enabled, objects to be uploaded will be encrypted and stored on OBS. When you download the encrypted objects, the encrypted data will be decrypted on the server and displayed in plaintext to users.

                                                    +
                                                    • If KMS encryption is enabled, MD5 verification cannot be used.
                                                    • If the KMS ID of another project is used, change Project ID to the ID of the project to which KMS belongs. If KMS and CDM are in the same project, retain the default value of Project ID.
                                                    • After KMS encryption is performed, the encryption status of the objects on OBS cannot be changed.
                                                    • A key in use cannot be deleted. Otherwise, the object encrypted with this key cannot be downloaded.
                                                    +
                                                    +
                                                    +
                                                    +
                                                    + +
                                                    + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0591.html b/docs/dataartsstudio/umn/dataartsstudio_01_0591.html new file mode 100644 index 000000000..e143a7460 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0591.html @@ -0,0 +1,18 @@ + + +

                                                    MD5 Verification

                                                    +

                                                    CDM extracts data from the migration source and writes the data to the migration destination. Figure 1 shows the migration mode when files are migrated to OBS.

                                                    +
                                                    Figure 1 Migrating files to OBS
                                                    +

                                                    During the process, CDM uses MD5 to verify file consistency.

                                                    +
                                                    • Extract
                                                      • The migration source can be OBS, HDFS, FTP, SFTP, or HTTP. It can check whether the files extracted by CDM are consistent with source files.
                                                      • This function is controlled by the MD5 File Extension parameter (available when File Format is set to Binary) in Source Job Configuration. Set this parameter to the file name extension of the MD5 file in the source file system.
                                                      • If a source file build.sh and a file for saving MD5 value build.sh.md5 are located in the same directory, and MD5 File Extension is configured, only the file build.sh.md5 is migrated to the destination. Files without the MD5 value or whose MD5 values do not match fail to be migrated, and the MD5 file is not migrated.
                                                      • If MD5 File Extension is not configured, all files are migrated.
                                                      +
                                                    • Write
                                                      • Currently, this function can be used only when OBS serves as the migration destination. It can check whether the files written to OBS are consistent with those extracted from CDM.
                                                      • This function is controlled by the Validate MD5 Value parameter in Destination Job Configuration. After the files are read and written to OBS, the MD5 value in the HTTP header is used to verify the files on OBS and the verification result is written to an OBS bucket (the bucket can be the one that does not store migration files). If the migration source does not have the MD5 file, the verification will not be performed.
                                                      +
                                                    +
                                                    • When files are migrated to a file system, only the extracted files are verified.
                                                    • When files are migrated to OBS, both the extracted files and files written to OBS are verified.
                                                    • If MD5 verification is used, KMS encryption cannot be used.
                                                    +
                                                    +
                                                    +
                                                    + +
                                                    + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0105.html b/docs/dataartsstudio/umn/dataartsstudio_01_0592.html similarity index 78% rename from docs/dataartsstudio/umn/dataartsstudio_01_0105.html rename to docs/dataartsstudio/umn/dataartsstudio_01_0592.html index 514d0c7ab..ae6b4f803 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0105.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0592.html @@ -1,10 +1,10 @@ - +

                                                    Migrating Files with Specified Names

                                                    -

                                                    You can migrate files (a maximum of 50) with specified names from FTP, OBS, or SFTP at a time. The exported files can only be written to the same directory on the migration destination.

                                                    -

                                                    When creating a table/file migration job, if the migration source is FTP, OBS, or SFTP, Source Directory/File can contain a maximum of 50 file names, which are separated by vertical bars (|). You can also customize a file separator.

                                                    -
                                                    1. CDM supports incremental file migration (by skipping repeated files), but does not support resumable transfer.

                                                      For example, if three files are to be migrated and the second file fails to be migrated due to the network fault. When the migration task is started again, the first file is skipped. The second file, however, cannot be migrated from the point where the fault occurs, but can only be migrated again.

                                                      -
                                                    2. During file migration, a single task supports millions of files. If there are too many files in the directory to be migrated, you are advised to split the files into different directories and create multiple tasks.
                                                    +

                                                    You can migrate files (a maximum of 50) with specified names from FTP, OBS, or SFTP at a time. The exported files can only be written to the same directory on the migration destination.

                                                    +

                                                    When creating a table/file migration job, if the migration source is FTP, OBS, or SFTP, Source Directory/File can contain a maximum of 50 file names, which are separated by vertical bars (|). You can also customize a file separator.

                                                    +
                                                    1. CDM supports incremental file migration (by skipping repeated files), but does not support resumable transfer.

                                                      For example, if three files are to be migrated and the second file fails to be migrated due to the network fault. When the migration task is started again, the first file is skipped. The second file, however, cannot be migrated from the point where the fault occurs, but can only be migrated again.

                                                      +
                                                    2. During file migration, a single task supports millions of files. If there are too many files in the directory to be migrated, you are advised to split the files into different directories and create multiple tasks.
                                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0106.html b/docs/dataartsstudio/umn/dataartsstudio_01_0593.html similarity index 63% rename from docs/dataartsstudio/umn/dataartsstudio_01_0106.html rename to docs/dataartsstudio/umn/dataartsstudio_01_0593.html index dafb25fd0..2ea6fa6a1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0106.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0593.html @@ -1,38 +1,39 @@ - +

                                                    Regular Expressions for Separating Semi-structured Text

                                                    -

                                                    During table/file migration, CDM uses delimiters to separate fields in CSV files. However, delimiters cannot be used in complex semi-structured data because the field values also contain delimiters. In this case, the regular expression can be used to separate the fields.

                                                    -

                                                    The regular expression is configured in Source Job Configuration. The migration source must be an object storage or file system, and File Format must be CSV.

                                                    -
                                                    Figure 1 Setting regular expression parameters
                                                    -
                                                    During the migration of CSV files, CDM can use regular expressions to separate fields and write parsed results to the migration destination. For details about the syntax of the regular expression, refer to the related documents. This section describes the regular expressions of the following log files: +

                                                    During table/file migration, CDM uses delimiters to separate fields in CSV files. However, delimiters cannot be used in complex semi-structured data because the field values also contain delimiters. In this case, the regular expression can be used to separate the fields.

                                                    +

                                                    The regular expression is configured in Source Job Configuration. The migration source must be an object storage or file system, and File Format must be CSV.

                                                    +
                                                    Figure 1 Setting regular expression parameters
                                                    +

                                                    +
                                                    During the migration of CSV files, CDM can use regular expressions to separate fields and write parsed results to the migration destination. For details about the syntax of the regular expression, refer to the related documents. This section describes the regular expressions of the following log files:
                                                    -

                                                    Log4J Log

                                                    • Log sample:
                                                      2018-01-11 08:50:59,001 INFO  [org.apache.sqoop.core.SqoopConfiguration.configureClassLoader(SqoopConfiguration.java:251)] Adding jars to current classloader from property: org.apache.sqoop.classpath.extra
                                                      -
                                                    • Regular expression:
                                                      ^(\d.*\d) (\w*)  \[(.*)\] (\w.*).*
                                                      -
                                                    • Parsing result: -
                                                      - - - @@ -94,7 +94,7 @@
                                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1215.html b/docs/dataartsstudio/umn/dataartsstudio_01_1215.html deleted file mode 100644 index 81ddec889..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1215.html +++ /dev/null @@ -1,118 +0,0 @@ - - -

                                                      Link to Doris

                                                      -

                                                      CDM can connect to open-source Doris and MRS Doris. Table 1 lists the parameters for a Doris link.

                                                      -

                                                      Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                                      -
                                                      - -
                                                      Table 1 Log4J log parsing result

                                                      Column Number

                                                      +

                                                      Log4J Log

                                                      • Log sample:
                                                        2018-01-11 08:50:59,001 INFO  [org.apache.sqoop.core.SqoopConfiguration.configureClassLoader(SqoopConfiguration.java:251)] Adding jars to current classloader from property: org.apache.sqoop.classpath.extra
                                                        +
                                                      • Regular expression:
                                                        ^(\d.*\d) (\w*)  \[(.*)\] (\w.*).*
                                                        +
                                                      • Parsing result: +
                                                        - - - - - - - - - @@ -40,53 +41,53 @@ -

                                                        Log4J Audit Log

                                                        • Log sample:
                                                          2018-01-11 08:51:06,156 INFO  [org.apache.sqoop.audit.FileAuditLogger.logAuditEvent(FileAuditLogger.java:61)] user=sqoop.anonymous.user    ip=189.xxx.xxx.75    op=show    obj=version    objId=x
                                                          -
                                                        • Regular expression:
                                                          ^(\d.*\d) (\w*)  \[(.*)\] user=(\w.*)    ip=(\w.*)    op=(\w.*)    obj=(\w.*)    objId=(.*).*
                                                          -
                                                        • Parsing result: -
                                                        Table 1 Log4J log parsing result

                                                        Column Number

                                                        Example Value

                                                        +

                                                        Example Value

                                                        1

                                                        +

                                                        1

                                                        2018-01-11 08:50:59,001

                                                        +

                                                        2018-01-11 08:50:59,001

                                                        2

                                                        +

                                                        2

                                                        INFO

                                                        +

                                                        INFO

                                                        3

                                                        +

                                                        3

                                                        org.apache.sqoop.core.SqoopConfiguration.configureClassLoader(SqoopConfiguration.java:251)

                                                        +

                                                        org.apache.sqoop.core.SqoopConfiguration.configureClassLoader(SqoopConfiguration.java:251)

                                                        4

                                                        +

                                                        4

                                                        Adding jars to current classloader from property: org.apache.sqoop.classpath.extra

                                                        +

                                                        Adding jars to current classloader from property: org.apache.sqoop.classpath.extra

                                                        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1207.html b/docs/dataartsstudio/umn/dataartsstudio_01_1207.html index 7bd665f24..37ed1a4fc 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1207.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1207.html @@ -7,7 +7,7 @@ - - - @@ -109,12 +109,12 @@ - - @@ -122,7 +122,8 @@ - - - @@ -90,38 +90,54 @@ - - - - - - - - - - + + + + + + + + + + + + + + + +
                                                        Table 2 Log4J audit log parsing result

                                                        Column Number

                                                        +

                                                        Log4J Audit Log

                                                        • Log sample:
                                                          2018-01-11 08:51:06,156 INFO  [org.apache.sqoop.audit.FileAuditLogger.logAuditEvent(FileAuditLogger.java:61)] user=sqoop.anonymous.user    ip=189.xxx.xxx.75    op=show    obj=version    objId=x
                                                          +
                                                        • Regular expression:
                                                          ^(\d.*\d) (\w*)  \[(.*)\] user=(\w.*)    ip=(\w.*)    op=(\w.*)    obj=(\w.*)    objId=(.*).*
                                                          +
                                                        • Parsing result: +
                                                          - - - - - - - - - - - - - - - - - @@ -94,39 +95,39 @@ -

                                                          Tomcat Log

                                                          • Log sample:
                                                            11-Jan-2018 09:00:06.907 INFO [main] org.apache.catalina.startup.VersionLoggerListener.log OS Name:               Linux
                                                            +

                                                            Tomcat Log

                                                            • Log sample:
                                                              11-Jan-2018 09:00:06.907 INFO [main] org.apache.catalina.startup.VersionLoggerListener.log OS Name:               Linux
                                                            -
                                                            • Regular expression:
                                                              ^(\d.*\d) (\w*) \[(.*)\] ([\w\.]*) (\w.*).*
                                                              -
                                                            • Parsing result: -
                                                          Table 2 Log4J audit log parsing result

                                                          Column Number

                                                          Example Value

                                                          +

                                                          Example Value

                                                          1

                                                          +

                                                          1

                                                          2018-01-11 08:51:06,156

                                                          +

                                                          2018-01-11 08:51:06,156

                                                          2

                                                          +

                                                          2

                                                          INFO

                                                          +

                                                          INFO

                                                          3

                                                          +

                                                          3

                                                          org.apache.sqoop.audit.FileAuditLogger.logAuditEvent(FileAuditLogger.java:61)

                                                          +

                                                          org.apache.sqoop.audit.FileAuditLogger.logAuditEvent(FileAuditLogger.java:61)

                                                          4

                                                          +

                                                          4

                                                          sqoop.anonymous.user

                                                          +

                                                          sqoop.anonymous.user

                                                          5

                                                          +

                                                          5

                                                          189.xxx.xxx.75

                                                          +

                                                          189.xxx.xxx.75

                                                          6

                                                          +

                                                          6

                                                          show

                                                          +

                                                          show

                                                          7

                                                          +

                                                          7

                                                          version

                                                          +

                                                          version

                                                          8

                                                          +

                                                          8

                                                          x

                                                          +

                                                          x

                                                          - - - - - - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1101.html b/docs/dataartsstudio/umn/dataartsstudio_01_1101.html index 1f0f79d10..a48c8eb47 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1101.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1101.html @@ -2,13 +2,9 @@

                                                          Changing the Job Owner

                                                          DataArts Factory allows you to change the job owner with a few clicks.

                                                          -

                                                          Procedure

                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                          4. At the top of the job directory, click and select Configure Owner.
                                                            Figure 1 Changing the owner
                                                            +

                                                            Procedure

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                            4. At the top of the job directory, click and select Configure Owner.
                                                              Figure 1 Changing the owner
                                                            5. Set Current Owner and Target Owner and click Migrate.
                                                            6. When the owner is changed, click Close.
                                                            -

                                                            Related Operations

                                                            You can use an owner to filter jobs by entering the owner in the search box above the job directory.

                                                            -
                                                            Figure 2 Filtering jobs by owner
                                                            -

                                                            -
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1102.html b/docs/dataartsstudio/umn/dataartsstudio_01_1102.html index 2f144c517..1f8b30c06 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1102.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1102.html @@ -2,12 +2,9 @@

                                                          Changing the Script Owner

                                                          DataArts Factory allows you to change the script owner with a few clicks.

                                                          -

                                                          Procedure

                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                          4. At the top of the script directory, click and select Configure Owner.
                                                            Figure 1 Changing the owner
                                                            +

                                                            Procedure

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                            4. At the top of the script directory, click and select Configure Owner.
                                                              Figure 1 Changing the owner
                                                            5. Set Current Owner and Target Owner and click Migrate.
                                                            6. When the owner is changed, click Close.
                                                            -

                                                            Related Operations

                                                            You can use an owner to filter scripts by entering the owner in the search box above the script directory.

                                                            -
                                                            Figure 2 Filtering scripts by owner
                                                            -
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1104.html b/docs/dataartsstudio/umn/dataartsstudio_01_1104.html new file mode 100644 index 000000000..1f26d4223 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1104.html @@ -0,0 +1,207 @@ + + +

                                                          MRS Impala SQL

                                                          +

                                                          Functions

                                                          The MRS Impala SQL node is used to execute the Impala SQL script predefined in DataArts Factory.

                                                          +
                                                          +

                                                          Parameters

                                                          Table 1 and Table 2 describe the parameters of the MRS Impala node.

                                                          + +
                                                          Table 3 Tomcat log parsing result

                                                          Column Number

                                                          +
                                                          • Regular expression:
                                                            ^(\d.*\d) (\w*) \[(.*)\] ([\w\.]*) (\w.*).*
                                                            +
                                                          • Parsing result: +
                                                            - - - - - - - - - - - @@ -134,33 +135,33 @@ -

                                                            Django Log

                                                            • Log sample:
                                                              [08/Jan/2018 20:59:07 ] settings     INFO     Welcome to Hue 3.9.0
                                                              -
                                                            • Regular expression:
                                                              ^\[(.*)\] (\w*)     (\w*)     (.*).*
                                                              -
                                                            • Parsing result: -
                                                            Table 3 Tomcat log parsing result

                                                            Column Number

                                                            Example Value

                                                            +

                                                            Example Value

                                                            1

                                                            +

                                                            1

                                                            11-Jan-2018 09:00:06.907

                                                            +

                                                            11-Jan-2018 09:00:06.907

                                                            2

                                                            +

                                                            2

                                                            INFO

                                                            +

                                                            INFO

                                                            3

                                                            +

                                                            3

                                                            main

                                                            +

                                                            main

                                                            4

                                                            +

                                                            4

                                                            org.apache.catalina.startup.VersionLoggerListener.log

                                                            +

                                                            org.apache.catalina.startup.VersionLoggerListener.log

                                                            5

                                                            +

                                                            5

                                                            OS Name:Linux

                                                            +

                                                            OS Name:Linux

                                                            + + + +
                                                            Table 4 Django log parsing result

                                                            Column Number

                                                            +

                                                            Django Log

                                                            • Log sample:
                                                              [08/Jan/2018 20:59:07 ] settings     INFO     Welcome to Hue 3.9.0
                                                              +
                                                            • Regular expression:
                                                              ^\[(.*)\] (\w*)     (\w*)     (.*).*
                                                              +
                                                            • Parsing result: +
                                                              - - - - - - - - - @@ -168,33 +169,33 @@ -

                                                              Apache Server Log

                                                              • Log sample:
                                                                [Mon Jan 08 20:43:51.854334 2018] [mpm_event:notice] [pid 36465:tid 140557517657856] AH00489: Apache/2.4.12 (Unix) OpenSSL/1.0.1t configured -- resuming normal operations
                                                                -
                                                              • Regular expression:
                                                                ^\[(.*)\] \[(.*)\] \[(.*)\] (.*).*
                                                                -
                                                              • Parsing result: -
                                                              Table 4 Django log parsing result

                                                              Column Number

                                                              Example Value

                                                              +

                                                              Example Value

                                                              1

                                                              +

                                                              1

                                                              08/Jan/2018 20:59:07

                                                              +

                                                              08/Jan/2018 20:59:07

                                                              2

                                                              +

                                                              2

                                                              settings

                                                              +

                                                              settings

                                                              3

                                                              +

                                                              3

                                                              INFO

                                                              +

                                                              INFO

                                                              4

                                                              +

                                                              4

                                                              Welcome to Hue 3.9.0

                                                              +

                                                              Welcome to Hue 3.9.0

                                                              - - @@ -65,15 +65,22 @@
                                                              • A cluster configuration file contains the configuration parameters of the cluster. If the cluster configuration parameters are modified, you need to obtain the configuration file again.
                                                              • The keytab file is the authentication credential file. Before obtaining the keytab file, you need to change the password of this user at least once in the cluster. Otherwise, the downloaded keytab file may be unavailable. After a user password is changed, the exported keytab file becomes invalid, and you need to export a keytab file again.
                                                              • The keytab file is used only in a cluster in security mode. In other cases, you do not need to prepare the keytab file.
                                                              -

                                                              Procedure

                                                              1. On the CDM console, choose Cluster Management in the left navigation pane. Locate the row that contains a cluster and choose Job Management > Links > Cluster Configurations.
                                                              2. On the Cluster Configurations page, click Create Cluster Configuration and set the parameters as prompt.
                                                                Figure 2 Creating cluster configurations
                                                                +

                                                                Procedure

                                                                1. On the CDM console, choose Cluster Management in the left navigation pane. Locate the row that contains a cluster and choose Job Management > Links > Cluster Configurations.
                                                                2. On the Cluster Configurations page, click Create Cluster Configuration and set the parameters as prompt.
                                                                  Figure 2 Creating cluster configurations
                                                                  • Configuration Name: Enter a cluster configuration name that is easy to remember and distinguish based on the type of the data source to be connected.
                                                                  • Configuration File: Click Select File to select a local cluster configuration file, and then click Upload on the right to upload the file.
                                                                  • Principal: This parameter is required only for clusters in security mode. Principal is the username in Kerberos security mode and must be the same as that in the keytab file.
                                                                  • Keytab File: Upload the keytab file only for clusters in security mode. Click Select File to select a local keytab file, and then click Upload on the right to upload the file.
                                                                  • Description: Add a description to identify and distinguish the cluster configuration.
                                                                  -
                                                                3. Click OK. When creating a Hadoop link, set Authentication Method as required, Use Cluster Config to Yes, and then select the corresponding cluster configuration name to quickly create a Hadoop link.
                                                                  Figure 3 Use Cluster Config
                                                                  +
                                                                4. Click OK. When creating a Hadoop link, set Authentication Method as required, Use Cluster Config to Yes, and then select the corresponding cluster configuration name to quickly create a Hadoop link.
                                                                  Figure 3 Use Cluster Config
                                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1097.html b/docs/dataartsstudio/umn/dataartsstudio_01_1097.html index 142556ceb..9b97b9465 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1097.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1097.html @@ -4,15 +4,15 @@

                                                              You can view a job dependency graph to learn the upstream and downstream jobs associated with the job.

                                                              Prerequisites

                                                              Dependent jobs have been configured in the job scheduling configuration in Developing a Pipeline Job. Otherwise, only the current job node can be displayed in the view, and the associated upstream and downstream job nodes cannot be displayed.

                                                              -

                                                              Procedure

                                                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                              4. In the job directory, right-click the job you want to view and choose View Job Dependency Graph from the shortcut menu.
                                                                Figure 1 Job Dependency page
                                                                +

                                                                Procedure

                                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                4. In the job directory, right-click the job you want to view and choose View Job Dependency Graph from the shortcut menu.
                                                                  Figure 1 Job Dependency page

                                                                  -
                                                                5. On the displayed Job Dependency page, perform any of the following operations:
                                                                  • In the upper right corner, select Display complete dependency graphs, Display the current job and its upstream and downstream jobs, or Display the current job and its directly connected jobs.
                                                                  • In the search box in the upper right corner, you can enter the name of a node to search for the node. The node found will be highlighted.
                                                                  • Click Download to download the job dependency file.
                                                                  • Scroll your mouse wheel to zoom in or zoom out the dependency graph.
                                                                  • Drag the blank area to view the complete relationship graph.
                                                                  • When the cursor is hovered on a job node, the node is marked green, its upstream job is marked blue, and its downstream job is marked yellow.
                                                                    Figure 2 Marking upstream and downstream job nodes of a node
                                                                    -
                                                                  • Right-click a job node to view the job, copy the job name, and collapse upstream or downstream jobs.
                                                                    Figure 3 Job node operations
                                                                    +
                                                                  • On the displayed Job Dependency page, perform any of the following operations:
                                                                    • In the upper right corner, select Display complete dependency graphs, Display the current job and its upstream and downstream jobs, or Display the current job and its directly connected jobs.
                                                                    • In the search box in the upper right corner, you can enter the name of a node to search for the node. The node found will be highlighted.
                                                                    • Click Download to download the job dependency file.
                                                                    • Scroll your mouse wheel to zoom in or zoom out the dependency graph.
                                                                    • Drag the blank area to view the complete relationship graph.
                                                                    • When the cursor is hovered on a job node, the node is marked green, its upstream job is marked blue, and its downstream job is marked yellow.
                                                                      Figure 2 Marking upstream and downstream job nodes of a node
                                                                      +
                                                                    • Right-click a job node to view the job, copy the job name, and collapse upstream or downstream jobs.
                                                                      Figure 3 Job node operations

                                                                -

                                                                Viewing a Job Dependency Graph

                                                                1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                2. Right-click the job directory and select View Job Dependency Graph.
                                                                  Figure 4 Viewing the job dependency graph
                                                                  +

                                                                  Viewing a Job Dependency Graph

                                                                  1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                  2. Right-click the job directory and select View Job Dependency Graph.
                                                                    Figure 4 Viewing the job dependency graph

                                                                  3. The system displays the dependencies between all the jobs in the directory. You can search for jobs by name. The matched jobs will be highlighted.
                                                                    • If you click a node in the dependency graph, its upstream jobs are marked blue and its downstream jobs are marked yellow.
                                                                    • You can drag to view the full dependency graph.
                                                                    • Scroll the mouse wheel to zoom in or out the dependency graph.
                                                                    @@ -25,3 +25,10 @@
                                                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1098.html b/docs/dataartsstudio/umn/dataartsstudio_01_1098.html index e6efeaf19..638509dc1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1098.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1098.html @@ -99,6 +99,13 @@
                                                              + + + +
                                                              Table 5 Apache server log parsing result

                                                              Column Number

                                                              +

                                                              Apache Server Log

                                                              • Log sample:
                                                                [Mon Jan 08 20:43:51.854334 2018] [mpm_event:notice] [pid 36465:tid 140557517657856] AH00489: Apache/2.4.12 (Unix) OpenSSL/1.0.1t configured -- resuming normal operations
                                                                +
                                                              • Regular expression:
                                                                ^\[(.*)\] \[(.*)\] \[(.*)\] (.*).*
                                                                +
                                                              • Parsing result: +
                                                                - - - - - - - - - @@ -209,3 +210,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0816.html b/docs/dataartsstudio/umn/dataartsstudio_01_0816.html index b27586f2f..e419b2e97 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0816.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0816.html @@ -28,14 +28,14 @@ - - @@ -49,7 +49,7 @@ @@ -130,7 +130,7 @@ - - @@ -280,7 +280,7 @@ @@ -333,7 +333,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0901.html b/docs/dataartsstudio/umn/dataartsstudio_01_0901.html index eadee99c9..0e51ed2f4 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0901.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0901.html @@ -7,9 +7,8 @@

                                                                Prerequisites

                                                                A script has been developed.

                                                                Submitting a Script Version

                                                                If you submit a version, the latest script in the development state will be saved and submitted and overwrite the previous script version.

                                                                -
                                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                4. In the script directory, double-click the developed script to access the script development page.
                                                                5. Above the script editor, click Submit to submit a version. In the displayed dialog box, select the reviewer, enter the change description (a maximum of 128 characters allowed), and select the check box below. If you do not select this option, you cannot click OK. When submitting a version, you can click Compare Version to view the differences between the current version and the last version.

                                                                  Figure 1 Submitting a version
                                                                  -

                                                                  -
                                                                  • If review is enabled on the Review Center page, your submitted version will be reviewed by the workspace admin on the Pending Review tab page on the Review Center page. The version is submitted successfully only after it is approved by the admin. For details, see Approval Settings.

                                                                    To revoke a submitted request, go to the Review Center page and click the My Applications tab. Then you can submit an application again.

                                                                    +
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                    4. In the script directory, double-click the developed script to access the script development page.
                                                                    5. Above the script editor, click Submit to submit a version. In the displayed dialog box, select the reviewer, enter the change description (a maximum of 128 characters allowed), and select the check box below. If you do not select this option, you cannot click OK. When submitting a version, you can click Compare Version to view the differences between the current version and the last version.

                                                                      Figure 1 Submitting a version
                                                                      +
                                                                      • If review is enabled on the Review Center page, your submitted version will be reviewed by the reviewer on the Pending Review tab page on the Review Center page. The version is submitted successfully only after it is approved by the reviewer. For details, see Approval Settings. If review is disabled, the version can be directly submitted.

                                                                        To revoke a submitted request, go to the Review Center page and click the My Applications tab. Then you can submit an application again.

                                                                      • If review is enabled, the following operations need to be reviewed: submitting scripts, deleting scripts, and importing submitted scripts.
                                                                      • Before disabling the review function, ensure that there are no requests pending review in the current workspace.
                                                                      • The enterprise mode does not support the review function.

                                                                    @@ -18,16 +17,16 @@
                                                                    The rollback involves the following contents:
                                                                    • DLI: data connections, databases, resource queues, and script contents
                                                                    • DWS: data connections, databases, and script contents
                                                                    • HIVE: data connections, databases, resource queues, and script contents
                                                                    • SPARK: data connections, databases, and script contents
                                                                    • SHELL: host connections, parameters, interactive parameters, and script contents
                                                                    • RDS: data connections, databases, and script contents
                                                                    • PRESTO: data connections, modes, and script contents
                                                                    • PYTHON: host connections, parameters, interactive parameters, and script content
                                                                    • FLINK: script content

                                                                    The procedure is as follows:

                                                                    -
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                    4. In the script directory list, double-click a script that you want to develop. The script development page is displayed.
                                                                    5. On the right of the page, click the Versions tab and view the version submission records. Select the version to be rolled back and click Roll Back.
                                                                      If the content in the development state is not submitted, the content will be overwritten after the rollback. In this case, you must submit the rollback version again to make it take effect. By default, the latest submitted version is used for scheduling.
                                                                      Figure 2 Rolling back a version
                                                                      +
                                                                      1. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                      2. In the script directory list, double-click a script that you want to develop. The script development page is displayed.
                                                                      3. On the right of the page, click the Versions tab and view the version submission records. Select the version to be rolled back and click Roll Back.
                                                                        If the content in the development state is not submitted, the content will be overwritten after the rollback. In this case, you must submit the rollback version again to make it take effect. By default, the latest submitted version is used for scheduling.
                                                                        Figure 2 Rolling back a version

                                                                      Version Comparison

                                                                      You can compare the script contents of two different versions. If you select only one version, the system compares the script content of the selected version with that in the development state. If you select two versions, the system compares the script contents of two different versions.

                                                                      The procedure is as follows:

                                                                      -
                                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                      2. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                      3. In the script directory list, double-click a script that you want to develop. The script development page is displayed.
                                                                      4. On the right of the page, click the Versions tab and view the version submission records. Select the versions to be compared and click Compare Version.
                                                                        Figure 3 Comparing versions
                                                                        +
                                                                        1. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                        2. In the script directory list, double-click a script that you want to develop. The script development page is displayed.
                                                                        3. On the right of the page, click the Versions tab and view the version submission records. Select the versions to be compared and click Compare Version.
                                                                          Figure 3 Comparing versions

                                                                          -
                                                                        4. A new page is displayed, showing the script content of different versions on the left and right separately. The differences between the two versions have been marked. You can use the and buttons in the upper right corner to go to the previous or next change.
                                                                          Figure 4 Version comparison details
                                                                          +
                                                                        5. A new page is displayed, showing the script content of different versions on the left and right separately. The differences between the two versions have been marked. You can use the and buttons in the upper right corner to go to the previous or next change.
                                                                          Figure 4 Version comparison details
                                                                  @@ -37,3 +36,10 @@
                                                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0902.html b/docs/dataartsstudio/umn/dataartsstudio_01_0902.html index 5bdbffcb8..35ab3744b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0902.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0902.html @@ -7,9 +7,8 @@

                                                                Prerequisites

                                                                A job has been developed.

                                                                Submitting a Job Version

                                                                If you submit a version, the latest job in the development state will be saved and submitted and overwrite the previous job version.

                                                                -
                                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                4. In the job directory, double-click the developed job to access the job development page.
                                                                5. Above the job canvas or editor, click Submit to submit a version. In the displayed dialog box, select the reviewer, enter the change description (a maximum of 128 characters allowed), and select the check box below. If you do not select this option, you cannot click OK. When submitting a version, you can click Compare Version to view the differences between the current version and the last version.

                                                                  Figure 1 Submitting a version
                                                                  -

                                                                  -
                                                                  • If review is enabled on the Review Center page, your submitted version will be reviewed by the workspace admin on the Pending Review tab page on the Review Center page. The version is submitted successfully only after it is approved by the admin. For details, see Approval Settings.

                                                                    To revoke a submitted request, go to the Review Center page and click the My Applications tab. Then you can submit an application again.

                                                                    +
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                    4. In the job directory, double-click the developed job to access the job development page.
                                                                    5. Above the job canvas or editor, click Submit to submit a version. In the displayed dialog box, select the reviewer, enter the change description (a maximum of 128 characters allowed), and select the check box below. If you do not select this option, you cannot click OK. When submitting a version, you can click Compare Version to view the differences between the current version and the last version.

                                                                      Figure 1 Submitting a version
                                                                      +
                                                                      • If review is enabled on the Review Center page, your submitted version will be reviewed by the reviewer on the Pending Review tab page on the Review Center page. The version is submitted successfully only after it is approved by the reviewer. For details, see Approval Settings. If review is disabled, the version can be directly submitted.

                                                                        To revoke a submitted request, go to the Review Center page and click the My Applications tab. Then you can submit an application again.

                                                                      • If review is enabled, the following operations need to be reviewed: submitting jobs, deleting jobs, and importing submitted jobs.
                                                                      • Before disabling the review function, ensure that there are no requests pending review in the current workspace.
                                                                      • The enterprise mode does not support the review function.

                                                                    @@ -18,20 +17,17 @@

                                                                    The rollback involves the following contents:

                                                                    • Job definition (such as operator properties and connection lines)
                                                                    • Basic job information, job scheduling configuration, job parameters, and lineage

                                                                    The procedure is as follows:

                                                                    -
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                    4. In the job directory, double-click a job to access the job development page.
                                                                    5. On the right of the page, click the Versions tab and view the version submission records. Select the version to be rolled back and click Roll Back.
                                                                      Figure 2 Rolling back the version
                                                                      -

                                                                      +
                                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                      3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                      4. In the job directory, double-click a job to access the job development page.
                                                                      5. On the right of the page, click the Versions tab and view the version submission records. Select the version to be rolled back and click Roll Back.
                                                                        Figure 2 Rolling back the version

                                                                  Viewing Version Details

                                                                  You can view the submitted version information in the version list.

                                                                  The procedure is as follows:

                                                                  -
                                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                  3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                  4. In the job directory, double-click a job to access the job development page.
                                                                  5. On the right of the page, click the Versions tab and view the version submission records. Select the desired version and click View to view its details.
                                                                    A new page is displayed, showing the job definition of the version. You cannot modify any job attributes in this window.
                                                                    Figure 3 Viewing version details
                                                                    +
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                    4. In the job directory, double-click a job to access the job development page.
                                                                    5. On the right of the page, click the Versions tab and view the version submission records. Select the desired version and click View to view its details.
                                                                      A new page is displayed, showing the job definition of the version. You cannot modify any job attributes in this window.
                                                                      Figure 3 Viewing version details
                                                                      -

                                                                    -

                                                                    Version Comparison

                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                    4. In the job directory, double-click a job to access the job development page.
                                                                    5. On the right of the page, click the Versions tab and view the version submission records. Select the versions to be compared and click Compare Version.

                                                                      If you select only one version, the selected version is compared with the JSON of the development-state job. If you select two versions, the JSON of the two versions is compared.

                                                                      -
                                                                      Figure 4 Comparing versions
                                                                      -

                                                                      +

                                                                      Version Comparison

                                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                      3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                      4. In the job directory, double-click a job to access the job development page.
                                                                      5. On the right of the page, click the Versions tab and view the version submission records. Select the versions to be compared and click Compare Version.

                                                                        If you select only one version, the selected version is compared with the JSON of the development-state job. If you select two versions, the JSON of the two versions is compared.

                                                                        +
                                                                        Figure 4 Comparing versions
                                                                    @@ -41,3 +37,10 @@
                                                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0912.html b/docs/dataartsstudio/umn/dataartsstudio_01_0912.html index e35944106..28cce3e3e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0912.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0912.html @@ -2,15 +2,15 @@

                                                                  Unlocking a Script

                                                                  Script and job unlocking depends on the lock function of DataArts Factory.

                                                                  -
                                                                  The lock function prevents conflict caused by collaborative script or job development. If you create or import a script or job, it is locked by you by default. You can only edit, save, or submit a script or job you have locked. To edit, save, or submit a script or job that is locked by another user or not locked by any user, you must lock the script or job first.
                                                                  • You can view the lock status of a script or job in the script or job directory tree.
                                                                  • To view the latest version of an opened script or job locked by another user, you need to re-open the script or job because it is not updated in real time.
                                                                  • Scripts or jobs that were created before the lock function was available are now unlocked by default. To edit, save, or submit these scripts or jobs, you need to lock them first.
                                                                  • The locking operation depends on the soft and hard lock policies. For details about how to configure soft and hard lock policies, see Configuring a Default Item.
                                                                    • Soft lock: You can lock or unlock jobs or scripts, regardless of whether they are locked by others.
                                                                    • Hard Lock: You can lock jobs or scripts only after they have been unlocked by other users. The space administrator and the DARTS Administrator can lock and unlock jobs or scripts without any limitations.
                                                                    +
                                                                    The lock function prevents conflict caused by collaborative script or job development. If you create or import a script or job, it is locked by you by default. You can only edit, save, or submit a script or job you have locked. To edit, save, or submit a script or job that is locked by another user or not locked by any user, you must lock the script or job first.
                                                                    • You can view the lock status of a script or job in the script or job directory tree.
                                                                    • To view the latest version of an opened script or job locked by another user, you need to re-open the script or job because it is not updated in real time.
                                                                    • Scripts or jobs that were created before the lock function was available are now unlocked by default. To edit, save, or submit these scripts or jobs, you need to lock them first.
                                                                    • The locking operation depends on the soft and hard lock policies. For details about how to configure soft and hard lock policies, see Configuring a Default Item.
                                                                      • Soft lock: You can lock or unlock jobs or scripts, regardless of whether they are locked by others.
                                                                      • Hard Lock: You can lock jobs or scripts only after they have been unlocked by other users. The space administrator and the DARTS Administrator user can lock and unlock jobs or scripts without any limitations.
                                                                    • Do not lock a script or job that is locked by another user because if you do so, changes to the script or job made by the user will be lost. If you want to modify the script or job, contact the user to unlock the script or job, and lock it by yourself.
                                                                    -
                                                                    Figure 1 Lock statuses
                                                                    +
                                                                    Figure 1 Lock statuses

                                                                    Prerequisites

                                                                    A script has been developed.

                                                                    Unlocking a Script

                                                                    If you submit a version, the latest script in the development state will be saved and submitted and overwrite the previous script version. You are advised to unlock the script after submitting the version so that other developers can modify the script as needed.

                                                                    -
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                    4. In the script directory, double-click the developed script to access the script development page.
                                                                    5. In the upper part of the script editor, click Unlock to unlock the script.

                                                                      Figure 2 Unlocking a script
                                                                      +
                                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                      3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                      4. In the script directory, double-click the developed script to access the script development page.
                                                                      5. In the upper part of the script editor, click Unlock to unlock the script.

                                                                        Figure 2 Unlocking a script

                                                                    @@ -21,3 +21,10 @@
                                                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0913.html b/docs/dataartsstudio/umn/dataartsstudio_01_0913.html index 5814dd6f4..bd9258b9a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0913.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_0913.html @@ -2,15 +2,15 @@

                                                                  Unlocking a Job

                                                                  Script and job unlocking depends on the lock function of DataArts Factory.

                                                                  -
                                                                  The lock function prevents conflict caused by collaborative script or job development. If you create or import a script or job, it is locked by you by default. You can only edit, save, or submit a script or job you have locked. To edit, save, or submit a script or job that is locked by another user or not locked by any user, you must lock the script or job first.
                                                                  • You can view the lock status of a script or job in the script or job directory tree.
                                                                  • To view the latest version of an opened script or job locked by another user, you need to re-open the script or job because it is not updated in real time.
                                                                  • Scripts or jobs that were created before the lock function was available are now unlocked by default. To edit, save, or submit these scripts or jobs, you need to lock them first.
                                                                  • The locking operation depends on the soft and hard lock policies. For details about how to configure soft and hard lock policies, see Configuring a Default Item.
                                                                    • Soft lock: You can lock or unlock jobs or scripts, regardless of whether they are locked by others.
                                                                    • Hard Lock: You can lock jobs or scripts only after they have been unlocked by other users. The space administrator and the DARTS Administrator can lock and unlock jobs or scripts without any limitations.
                                                                    +
                                                                    The lock function prevents conflict caused by collaborative script or job development. If you create or import a script or job, it is locked by you by default. You can only edit, save, or submit a script or job you have locked. To edit, save, or submit a script or job that is locked by another user or not locked by any user, you must lock the script or job first.
                                                                    • You can view the lock status of a script or job in the script or job directory tree.
                                                                    • To view the latest version of an opened script or job locked by another user, you need to re-open the script or job because it is not updated in real time.
                                                                    • Scripts or jobs that were created before the lock function was available are now unlocked by default. To edit, save, or submit these scripts or jobs, you need to lock them first.
                                                                    • The locking operation depends on the soft and hard lock policies. For details about how to configure soft and hard lock policies, see Configuring a Default Item.
                                                                      • Soft lock: You can lock or unlock jobs or scripts, regardless of whether they are locked by others.
                                                                      • Hard Lock: You can lock jobs or scripts only after they have been unlocked by other users. The space administrator and the DARTS Administrator user can lock and unlock jobs or scripts without any limitations.
                                                                    • Do not lock a script or job that is locked by another user because if you do so, changes to the script or job made by the user will be lost. If you want to modify the script or job, contact the user to unlock the script or job, and lock it by yourself.
                                                                    -
                                                                    Figure 1 Lock statuses
                                                                    +
                                                                    Figure 1 Lock statuses

                                                                    Prerequisites

                                                                    A job has been developed.

                                                                    Procedure

                                                                    If you submit a version, the latest job in the development state will be saved and submitted and overwrite the previous job version. You are advised to unlock the job after submitting the version so that other developers can modify the job as needed.

                                                                    -
                                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                    4. In the job directory, double-click the developed job to access the job development page.
                                                                    5. Above the job canvas or editor, click Unlock to unlock the job.

                                                                      Figure 2 Unlocking a job
                                                                      +
                                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                      3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                      4. In the job directory, double-click the developed job to access the job development page.
                                                                      5. Above the job canvas or editor, click Unlock to unlock the job.

                                                                        Figure 2 Unlocking a job

                                                                    @@ -21,3 +21,10 @@
                                                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_0999.html b/docs/dataartsstudio/umn/dataartsstudio_01_0999.html deleted file mode 100644 index 8c07c2c70..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_0999.html +++ /dev/null @@ -1,80 +0,0 @@ - - -

                                                                  To Doris

                                                                  -

                                                                  Table 1 lists the destination job parameters when the destination link is a Doris link.

                                                                  - -
                                                                Table 5 Apache server log parsing result

                                                                Column Number

                                                                Example Value

                                                                +

                                                                Example Value

                                                                1

                                                                +

                                                                1

                                                                Mon Jan 08 20:43:51.854334 2018

                                                                +

                                                                Mon Jan 08 20:43:51.854334 2018

                                                                2

                                                                +

                                                                2

                                                                mpm_event:notice

                                                                +

                                                                mpm_event:notice

                                                                3

                                                                +

                                                                3

                                                                pid 36465:tid 140557517657856

                                                                +

                                                                pid 36465:tid 140557517657856

                                                                4

                                                                +

                                                                4

                                                                AH00489: Apache/2.4.12 (Unix) OpenSSL/1.0.1t configured -- resuming normal operations

                                                                +

                                                                AH00489: Apache/2.4.12 (Unix) OpenSSL/1.0.1t configured -- resuming normal operations

                                                                Data Lake Insight (DLI)

                                                                -

                                                                +

                                                                You must have the SELECT permission (for querying tables) on all fields of the DLI data source.

                                                                MRS ClickHouse

                                                                Data warehouse: MRS ClickHouse and Data Lake Insight (DLI)

                                                                • Recommended MRS ClickHouse version: 21.3.4.X
                                                                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                  +
                                                                • Recommended MRS ClickHouse version: 21.3.4.X
                                                                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                • Supported by local storage. Only MRS Hive and MRS Hudi are supported in storage-compute decoupling scenarios.
                                                                • Only MRS Hive is supported in Ranger scenarios.
                                                                • Not supported if SSL is enabled for ZooKeeper
                                                                • Recommended MRS HDFS versions:
                                                                  • 2.8.X
                                                                  • 3.1.X
                                                                • Recommended MRS HBase versions:
                                                                  • 2.1.X
                                                                  • 1.3.X
                                                                • MRS Hive and MRS Hudi 2.x versions are not supported. The following versions are recommended:
                                                                  • 1.2.X
                                                                  • 3.1.X
                                                                  -
                                                                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                  +
                                                                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                                                • Hadoop: MRS HDFS, MRS HBase, MRS Hive, and MRS Hudi
                                                                • Object storage: Object Storage Service (OBS)
                                                                • NoSQL: CloudTable
                                                                • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                                                • Search: Elasticsearch and Cloud Search Service (CSS)
                                                                • You are advised to use Data Replication Service (DRS) to migrate data between OLTP databases.
                                                                • Recommended Microsoft SQL Server version: 2005 or later
                                                                +
                                                                • Recommended Microsoft SQL Server version: 2005 or later
                                                                • Greenplum, Kingbase, and GaussDB can be connected using the PostgreSQL connector. The supported source and destination are the same as those of the PostgreSQL data source.

                                                                RDS for SQL Server

                                                                @@ -216,7 +216,7 @@
                                                                • Data warehouse: GaussDB(DWS) and Data Lake Insight (DLI)
                                                                • Hadoop: MRS HDFS, MRS HBase, and MRS Hive
                                                                • Object-based storage: Object Storage Service (OBS)
                                                                • Relational database: RDS for MySQL, RDS for PostgreSQL, and RDS for SQL Server
                                                                • NoSQL: CloudTable
                                                                • Search: Elasticsearch and Cloud Search Service (CSS)
                                                                • MRS Kafka cannot serve as the destination.
                                                                • Supported only by local storage and not in storage-compute decoupling scenarios.
                                                                • Not supported by Ranger.
                                                                • Not supported if SSL is enabled for ZooKeeper.
                                                                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                  +
                                                                • MRS Kafka cannot serve as the destination.
                                                                • Supported only by local storage and not in storage-compute decoupling scenarios
                                                                • Not supported by Ranger
                                                                • Not supported if SSL is enabled for ZooKeeper
                                                                • MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                Entire DB migration only to MRS HBase

                                                                Recommended versions:
                                                                • 2.1.X
                                                                • 1.3.X
                                                                -

                                                                MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                +

                                                                MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                MRS Hive

                                                                @@ -292,7 +292,7 @@

                                                                Entire DB migration only to a relational database

                                                                2.x versions are not supported. The following versions are recommended:
                                                                • 1.2.X
                                                                • 3.1.X
                                                                -

                                                                MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                +

                                                                MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2 are not supported, and only MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1 are supported.

                                                                FusionInsight HBase

                                                                @@ -312,7 +312,7 @@

                                                                Not supported

                                                                Entire DB migration only to a relational database

                                                                -
                                                                2.x versions are not supported. The following versions are recommended:
                                                                • 1.2.X
                                                                • 3.1.X
                                                                +
                                                                2.x versions are not supported. The following versions are recommended:
                                                                • 1.2.X
                                                                • 3.1.X

                                                                Not supported

                                                                Entire DB migration only to a relational database

                                                                -
                                                                2.x versions are not supported. The following versions are recommended:
                                                                • 1.2.X
                                                                • 3.1.X
                                                                +
                                                                2.x versions are not supported. The following versions are recommended:
                                                                • 1.2.X
                                                                • 3.1.X
                                                                - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                                                Table 1 Parameter description

                                                                Type

                                                                -

                                                                Parameter

                                                                -

                                                                Description

                                                                -

                                                                Example Value

                                                                -

                                                                Basic parameters

                                                                -

                                                                Schema/Tablespace

                                                                -

                                                                Name of the database to which data will be written. The schema can be automatically created. Click the icon next to the text box to select a schema or tablespace.

                                                                -

                                                                schema

                                                                -

                                                                Table Name

                                                                -

                                                                Name of the table to which data will be written. Click the icon next to the text box. The dialog box for selecting the table is displayed.

                                                                -

                                                                This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                                -
                                                                NOTE:

                                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Factory of DataArts Studio, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                                -
                                                                -

                                                                table

                                                                -

                                                                Clear Data Before Import

                                                                -
                                                                Whether to clear the data in the destination table before data import. The options are as follows:
                                                                • Do not clear: The data in the destination table is not cleared before data import. The imported data is just added to the table.
                                                                • Clear all data: All data is cleared from the destination table before data import.
                                                                • Clear part of data: Part of the data in the destination table is cleared before data import. If you select Clear part of data, you must configure WHERE Clause to specify which part will be deleted.
                                                                -
                                                                -

                                                                Clear part of data

                                                                -

                                                                WHERE Clause

                                                                -

                                                                If Clear Data Before Import is set to Clear part of data, data in the destination table will be deleted based on the WHERE clause after the configuration is complete and before the import starts.

                                                                -

                                                                age > 18 and age <= 60

                                                                -

                                                                Prepare for Data Import

                                                                -

                                                                The SQL statement that is first executed before a task is executed. Currently, only one SQL statement can be executed in wizard mode.

                                                                -

                                                                create temp table

                                                                -

                                                                Complete Statement After Data Import

                                                                -

                                                                The SQL statement that is executed after a task is executed. Currently, only one SQL statement can be executed.

                                                                -

                                                                merge into

                                                                -

                                                                Loader Threads

                                                                -

                                                                Number of threads started in each loader. A larger number allows more concurrent write operations. The unique model or aggregation function replace have requirements on the insertion sequence. When they are used, do not use the concurrency capability.

                                                                -

                                                                1

                                                                -
                                                                -
                                                                -
                                                              -
                                                              - -
                                                              - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1028.html b/docs/dataartsstudio/umn/dataartsstudio_01_1028.html index 160a0096e..0e834873e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1028.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1028.html @@ -1,17 +1,25 @@ -

                                                              Creating DataArts Studio Instances

                                                              -
                                                              +

                                                              Creating and Configuring a DataArts Studio Instance

                                                              +
                                                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1096.html b/docs/dataartsstudio/umn/dataartsstudio_01_1096.html index 2c6c8ab06..2ecbbfebc 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1096.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1096.html @@ -1,9 +1,9 @@ -

                                                              Managing Cluster Configurations

                                                              +

                                                              Creating a Hadoop Cluster Configuration

                                                              On the Cluster Configurations page, you can create, edit, or delete Hadoop cluster configurations.

                                                              When creating a Hadoop link, the Hadoop cluster configurations can simplify the link creation. See Figure 1 for details.

                                                              -
                                                              Figure 1 Comparison before and after using the cluster configurations
                                                              +
                                                              Figure 1 Comparison before and after using the cluster configurations

                                                              CDM supports the following types of Hadoop links:

                                                              • MRS clusters: MRS HDFS, MRS HBase, and MRS Hive
                                                              • FusionInsight clusters: FusionInsight HDFS, FusionInsight HBase, and FusionInsight Hive
                                                              • Apache clusters: Apache HDFS, Apache HBase, and Apache Hive

                                                              Scenario

                                                              Before creating a Hadoop link, you are advised to create cluster configurations to simplify the link parameter configurations.

                                                              @@ -24,13 +24,13 @@
                                                              • MRS HDFS
                                                              • MRS HBase
                                                              • MRS Hive
                                                              • MRS Hudi
                                                              • MRS ClickHouse

                                                              For clusters of MRS 3.x:

                                                              -
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose Cluster > Name of the desired cluster > Dashboard > More > Download Client.
                                                              3. In the dialog box that is displayed, select Configuration Files Only. The platform type must be the same as that on the server. Retain the default values of other parameters and click OK to download the configuration file to the local host.
                                                              4. Obtain the downloaded TAR package, which is the FusionInsight cluster configuration file.
                                                              +
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose Cluster > Name of the desired cluster > Dashboard > More > Download Client.
                                                              3. In the dialog box that is displayed, select Configuration Files Only. The platform type must be the same as that on the server. Retain the default values of other parameters and click OK to download the configuration file to the local host.
                                                              4. Obtain the downloaded TAR package, which is the FusionInsight cluster configuration file.

                                                              For clusters of MRS 2.x or earlier:

                                                              1. Log in to the MRS console.
                                                              2. Choose Clusters > Active Clusters and click a cluster name to go to the cluster details page. Click the Components tab.
                                                              3. Click Download Client. Set Client Type to Only configuration files, set Download To to Server or Remote host, customize the client path, and click OK to generate the client configuration file.
                                                              4. Save the generated configuration file to a local path.

                                                              See MRS documentation for details.

                                                              For clusters of MRS 3.x:

                                                              -
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose System > Permission > User, locate the row that contains the target user, and choose More > Download Authentication Credential to download the authentication credential file.
                                                              3. Obtain the downloaded TAR package, which is the keytab file of the FusionInsight cluster.
                                                              +
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose System > Permission > User, locate the row that contains the target user, and choose More > Download Authentication Credential to download the authentication credential file.
                                                              3. Obtain the downloaded TAR package, which is the keytab file of the FusionInsight cluster.

                                                              For clusters of MRS 2.x or earlier:

                                                              1. Log in to MRS Manager and click System. In the Permission area, click Manage User.
                                                              2. In the row of the user for whom you want to export the keytab file, choose More > Download authentication credential to download the authentication file. After the file is automatically generated, save it to a specified path and keep it properly.

                                                              See MRS documentation for details.

                                                              @@ -39,10 +39,10 @@

                                                              FusionInsight clusters:

                                                              • FusionInsight HDFS
                                                              • FusionInsight HBase
                                                              • FusionInsight Hive
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose Cluster > Name of the desired cluster > Dashboard > More > Download Client.
                                                              3. In the dialog box that is displayed, select Configuration Files Only. The platform type must be the same as that on the server. Retain the default values of other parameters and click OK to download the configuration file to the local host.
                                                              4. Obtain the downloaded TAR package, which is the FusionInsight cluster configuration file.
                                                              +
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose Cluster > Name of the desired cluster > Dashboard > More > Download Client.
                                                              3. In the dialog box that is displayed, select Configuration Files Only. The platform type must be the same as that on the server. Retain the default values of other parameters and click OK to download the configuration file to the local host.
                                                              4. Obtain the downloaded TAR package, which is the FusionInsight cluster configuration file.

                                                              See the FusionInsight documentation for details.

                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose System > Permission > User, locate the row that contains the target user, and choose More > Download Authentication Credential to download the authentication credential file.
                                                              3. Obtain the downloaded TAR package, which is the keytab file of the FusionInsight cluster.
                                                              +
                                                              1. Log in to FusionInsight Manager.
                                                              2. Choose System > Permission > User, locate the row that contains the target user, and choose More > Download Authentication Credential to download the authentication credential file.
                                                              3. Obtain the downloaded TAR package, which is the keytab file of the FusionInsight cluster.

                                                              See the FusionInsight documentation for details.

                                                              If you select this option, the node will not be executed, and a success message will be returned.

                                                              Task Groups

                                                              +

                                                              No

                                                              +

                                                              Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                              +
                                                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1099.html b/docs/dataartsstudio/umn/dataartsstudio_01_1099.html index 75d121890..e96446042 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1099.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1099.html @@ -44,7 +44,7 @@

                                                            No

                                                            If the associated SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                            -

                                                            If the parameters of the associated SQL script are changed, click to refresh the parameters.

                                                            +

                                                            If the parameters of the associated SQL script are changed, click to refresh the parameters.

                                                            Node Name

                                                            @@ -112,6 +112,13 @@

                                                            If you select this option, the node will not be executed, and a success message will be returned.

                                                            Task Groups

                                                            +

                                                            No

                                                            +

                                                            Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                            +
                                                            @@ -142,17 +149,17 @@

                                                          Modify

                                                          Click to modify the parameter settings. After the modification, save the settings.

                                                          +

                                                          Click to modify the parameter settings. After the modification, save the settings.

                                                          Delete

                                                          Click to delete the parameter settings.

                                                          +

                                                          Click to delete the parameter settings.

                                                          View Details

                                                          Click to view details about the table created based on the input lineage.

                                                          +

                                                          Click to view details about the table created based on the input lineage.

                                                          Output

                                                          @@ -175,17 +182,17 @@

                                                          Modify

                                                          Click to modify the parameter settings. After the modification, save the settings.

                                                          +

                                                          Click to modify the parameter settings. After the modification, save the settings.

                                                          Delete

                                                          Click to delete the parameter settings.

                                                          +

                                                          Click to delete the parameter settings.

                                                          View Details

                                                          Click to view details about the table created based on the output lineage.

                                                          +

                                                          Click to view details about the table created based on the output lineage.

                                                          + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                          Table 1 Parameters

                                                          Parameter

                                                          +

                                                          Mandatory

                                                          +

                                                          Description

                                                          +

                                                          Node Name

                                                          +

                                                          Yes

                                                          +

                                                          Name of a node. The name must contain 1 to 128 characters, including only letters, numbers, underscores (_), hyphens (-), slashes (/), less-than signs (<), and greater-than signs (>).

                                                          +

                                                          By default, the node name is the same as that of the selected script. If you want the node name to be different from the script name, disable this function by referring to Disabling Auto Node Name Change.

                                                          +

                                                          SQL Script

                                                          +

                                                          Yes

                                                          +

                                                          Path of a script to be executed. If no script is available, create and develop a script by referring to Creating a Script and Developing an SQL Script.

                                                          +

                                                          Data Connection

                                                          +

                                                          Yes

                                                          +

                                                          Data connection that is configured in the SQL script. The value can be changed.

                                                          +

                                                          Database

                                                          +

                                                          Yes

                                                          +

                                                          Database that is configured in the SQL script. The value can be changed.

                                                          +

                                                          Resource Queue

                                                          +

                                                          No

                                                          +

                                                          Enter the resource queue name.

                                                          +

                                                          Script Parameter

                                                          +

                                                          No

                                                          +

                                                          If the associated SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.

                                                          +

                                                          If the parameters of the associated SQL script are changed, click to refresh the parameters.

                                                          +
                                                          +
                                                          + +
                                                          + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                          Table 2 Advanced parameters

                                                          Parameter

                                                          +

                                                          Mandatory

                                                          +

                                                          Description

                                                          +

                                                          Node Status Polling Interval (s)

                                                          +

                                                          Yes

                                                          +

                                                          How often the system check completeness of the node. The value ranges from 1 to 60 seconds.

                                                          +

                                                          Max. Node Execution Duration

                                                          +

                                                          Yes

                                                          +

                                                          Execution timeout interval for the node. If retry is configured and the execution is not complete within the timeout interval, the node will be executed again.

                                                          +

                                                          Retry upon Failure

                                                          +

                                                          Yes

                                                          +

                                                          Whether to re-execute a node if it fails to be executed. Possible values:

                                                          +
                                                          • Yes: The node will be re-executed, and the following parameters must be configured:
                                                            • Retry upon Timeout
                                                            • Maximum Retries
                                                            • Retry Interval (seconds)
                                                            +
                                                          • No: The node will not be re-executed. This is the default setting.
                                                            NOTE:

                                                            If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                            +

                                                            If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                            +

                                                            Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                            +
                                                            +
                                                          +

                                                          Policy for Handling Subsequent Nodes If the Current Node Fails

                                                          +

                                                          Yes

                                                          +

                                                          Operation that will be performed if the node fails to be executed. Possible values:

                                                          +
                                                          • Suspend execution plans of the subsequent nodes: stops running subsequent nodes. The job instance status is Failed.
                                                          • End the current job execution plan: stops running the current job. The job instance status is Failed.
                                                          • Go to the next node: ignores the execution failure of the current node. The job instance status is Failure ignored.
                                                          • Suspend the current job execution plan: If the current job instance is in abnormal state, the subsequent nodes of this node and the subsequent job instances that depend on the current job are in waiting state.
                                                          +

                                                          Enable Dry Run

                                                          +

                                                          No

                                                          +

                                                          If you select this option, the node will not be executed, and a success message will be returned.

                                                          +

                                                          Task Groups

                                                          +

                                                          No

                                                          +

                                                          Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                          +
                                                          +
                                                          + +
                                                          + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                          Table 3 Lineage

                                                          Parameter

                                                          +

                                                          Description

                                                          +

                                                          Input

                                                          +

                                                          Add

                                                          +

                                                          Click Add. In the Type drop-down list, select the type to be created. The value can be DWS, OBS, CSS, HIVE, DLI, or CUSTOM.

                                                          +

                                                          OK

                                                          +

                                                          Click OK to save the parameter settings.

                                                          +

                                                          Cancel

                                                          +

                                                          Click Cancel to cancel the parameter settings.

                                                          +

                                                          Modify

                                                          +

                                                          Click to modify the parameter settings. After the modification, save the settings.

                                                          +

                                                          Delete

                                                          +

                                                          Click to delete the parameter settings.

                                                          +

                                                          View Details

                                                          +

                                                          Click to view details about the table created based on the input lineage.

                                                          +

                                                          Output

                                                          +

                                                          Add

                                                          +

                                                          Click Add. In the Type drop-down list, select the type to be created. The value can be DWS, OBS, CSS, HIVE, DLI, or CUSTOM.

                                                          +

                                                          OK

                                                          +

                                                          Click OK to save the parameter settings.

                                                          +

                                                          Cancel

                                                          +

                                                          Click Cancel to cancel the parameter settings.

                                                          +

                                                          Modify

                                                          +

                                                          Click to modify the parameter settings. After the modification, save the settings.

                                                          +

                                                          Delete

                                                          +

                                                          Click to delete the parameter settings.

                                                          +

                                                          View Details

                                                          +

                                                          Click to view details about the table created based on the output lineage.

                                                          +
                                                          +
                                                          +
                                                        + +
                                                        + +
                                                        + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1105.html b/docs/dataartsstudio/umn/dataartsstudio_01_1105.html index 18da6f67c..890662188 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1105.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1105.html @@ -4,11 +4,11 @@

                                                        This section describes how to view the execution history of scripts, jobs, and nodes over a week.

                                                        Prerequisites

                                                        This function depends on OBS buckets. For details about how to configure OBS buckets, see Configuring an OBS Bucket.

                                                        -

                                                        Script Execution History

                                                        1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                        2. In the navigation pane of the DataArts Factory homepage, choose Data Development > Develop Script.
                                                        3. Above the directory, click to display the script and job execution history in the past seven days.
                                                        4. Select Scripts from the drop-down list box to filter out the script execution history.
                                                        5. Click a record to view the script information and execution result.
                                                        6. Download the historic script execution result.
                                                          • By default, all users can download the historic execution results of scripts.
                                                          • You can click Download on the Result tab page.
                                                          • You can download the result file in CSV format. A maximum of 1,000 results can be queried and downloaded.
                                                          +

                                                          Script Execution History

                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          3. In the navigation pane of the DataArts Factory homepage, choose Data Development > Develop Script.
                                                          4. Above the directory, click to display the script and job execution history in the past seven days.
                                                          5. Select Scripts from the drop-down list box to filter out the script execution history.
                                                          6. Click a record to view the script information and execution result.
                                                          7. Download the historic script execution result.
                                                            • By default, all users can download the historic execution results of scripts.
                                                            • You can click Download on the Result tab page.
                                                            • You can download the result file in CSV format. A maximum of 1,000 results can be queried and downloaded.
                                                          -

                                                          Job Execution History

                                                          1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                          2. In the left navigation pane of DataArts Factory, choose Data Development > Develop Job.
                                                          3. Above the directory, click to display the script and job execution history in the past seven days.
                                                          4. Select Jobs from the drop-down list box to filter out the job execution history.
                                                          5. Click a record to view the job and log information.

                                                            If only some nodes of the job were tested, the execution history only displays information and logs for these nodes.

                                                            +

                                                            Job Execution History

                                                            1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            2. In the left navigation pane of DataArts Factory, choose Data Development > Develop Job.
                                                            3. Above the directory, click to display the script and job execution history in the past seven days.
                                                            4. Select Jobs from the drop-down list box to filter out the job execution history.
                                                            5. Click a record to view the job and log information.

                                                              If only some nodes of the job were tested, the execution history only displays information and logs for these nodes.

                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1106.html b/docs/dataartsstudio/umn/dataartsstudio_01_1106.html index 3b1aa57c0..74dec88b1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1106.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1106.html @@ -4,7 +4,7 @@

                                                            The execution history of scripts, jobs, and nodes is stored in OBS buckets. If no OBS bucket is available, you cannot view the execution history. This section describes how to configure an OBS bucket.

                                                            Constraints

                                                            The OBS path is only supported for OBS buckets and not for parallel file systems.

                                                            -

                                                            Procedure

                                                            1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            2. In the navigation pane, choose Configuration > Configure.
                                                            3. Choose OBS Bucket.
                                                            4. Select an OBS bucket.

                                                              Figure 1 Configuring an OBS bucket
                                                              +

                                                              Procedure

                                                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              3. In the navigation pane, choose Configuration > Configure.
                                                              4. Choose OBS Bucket.
                                                              5. Select an OBS bucket.

                                                                Figure 1 Configuring an OBS bucket

                                                              6. Click Save.
                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1107.html b/docs/dataartsstudio/umn/dataartsstudio_01_1107.html index bb0d49c90..1b5291981 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1107.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1107.html @@ -2,8 +2,10 @@

                                                            Unlocking Scripts

                                                            This section describes how to unlock scripts in batches.

                                                            -

                                                            Procedure

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                            4. Click in the script directory and select Show Check Box.
                                                              Figure 1 Clicking Show Check Box
                                                              -
                                                            5. Select the scripts to unlock, click , and select Batch Unlock. The message "Unlocked." is displayed.
                                                              Figure 2 Batch Unlock
                                                              +

                                                              Procedure

                                                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                              4. Click in the script directory and select Show Check Box.
                                                                Figure 1 Clicking Show Check Box
                                                                +

                                                                +
                                                              5. Select the scripts to unlock, click , and select Batch Unlock. The message "Unlocked." is displayed.
                                                                Figure 2 Batch Unlock
                                                                +

                                                            @@ -13,3 +15,10 @@
                                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1108.html b/docs/dataartsstudio/umn/dataartsstudio_01_1108.html index 47ac8cb99..da8adfae1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1108.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1108.html @@ -2,7 +2,7 @@

                                                            Unlocking Jobs

                                                            This section describes how to unlock jobs in batches.

                                                            -

                                                            Procedure

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                            3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                            4. Click in the job directory and select Show Check Box.
                                                            5. Select the jobs to unlock, click , and select Batch Unlock. The message "Unlocked." is displayed.
                                                              Figure 1 Batch Unlock
                                                              +

                                                              Procedure

                                                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                              2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                              3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                              4. Click in the job directory and select Show Check Box.
                                                              5. Select the jobs to unlock, click , and select Batch Unlock. The message "Unlocked." is displayed.
                                                                Figure 1 Batch Unlock

                                                              @@ -13,3 +13,10 @@
                                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1203.html b/docs/dataartsstudio/umn/dataartsstudio_01_1203.html index 72785b495..33350f06f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1203.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1203.html @@ -536,7 +536,7 @@

                                                        exportJobTags

                                                        Import a tag from OBS

                                                        +

                                                        Importing a tag from OBS

                                                        tag

                                                        Use Agent

                                                        Whether to extract data from the data source through an agent

                                                        +

                                                        The agent function will be unavailable soon and does not need to be configured.

                                                        Yes

                                                        +

                                                        -

                                                        Agent

                                                        Click Select and select the agent created in Managing Agents.

                                                        +

                                                        The agent function will be unavailable soon and does not need to be configured.

                                                        -

                                                        (Optional) Displayed when you click Show Advanced Attributes.

                                                        Number of records submitted each time. Set this parameter based on the data destination and the job's data size. If the value is either too large or too small, the job may run for a long time.

                                                        -

                                                        +

                                                        10000

                                                        SSL Encryption

                                                        (Optional) Whether to connect to the database using SSL. This parameter is available for a MySQL link.

                                                        +

                                                        (Optional) Whether to connect to the database using SSL. This parameter is available for a MySQL link.

                                                        Yes

                                                        Link Attributes

                                                        (Optional) Click Add to add the JDBC connector attributes of multiple specified data sources. For details, see the JDBC connector document of the corresponding database.

                                                        -
                                                        The following are some examples:
                                                        • connectTimeout=600000 and socketTimeout=300000: When a large amount of data needs to be migrated or the entire table is retrieved using query statements, the migration fails due to connection timeout. In this case, you can customize the connection timeout interval (ms) and socket timeout interval (ms) to prevent failures caused by timeout.
                                                        • tinyInt1isBit=false or mysql.bool.type.transform=false: By default, tinyInt1isBit is true, indicating that TINYINT(1) is processed as a bit, that is, Types.BOOLEAN, and 1 or 0 is read as true or false. As a result, the migration fails. In this case, you can set tinyInt1isBit to false to avoid migration failures.
                                                        • useCursorFetch=false: By default, useCursorFetch is enabled, indicating that the JDBC connector communicates with relational databases using a binary protocol. Some third-party systems may have compatibility issues, causing migration time conversion errors. In this case, you can disable this function. Open-source MySQL databases support the useCursorFetch parameter, and you do not need to set this parameter.
                                                        • allowPublicKeyRetrieval=true: By default, public key retrieval is disabled for MySQL databases. If TLS is unavailable and an RSA public key is used for encryption, connection to an MySQL database may fail. In this case, you can enable public key retrieval to avoid connection failures.
                                                        +
                                                        The following are some examples:
                                                        • connectTimeout=600000 and socketTimeout=300000: When a large amount of data needs to be migrated or the entire table is retrieved using query statements, the migration fails due to connection timeout. In this case, you can customize the connection timeout interval (ms) and socket timeout interval (ms) to prevent failures caused by timeout.
                                                        • tinyInt1isBit=true (default): If the length of tinyInt is 1, the value is converted to a Boolean value. tinyInt1isBit=false: The value is converted to an integer.

                                                          If data fails to be written because true or false is read from the source, set this parameter to false to avoid migration errors. For details, see MySQL Documentation.

                                                          +
                                                        • useCursorFetch=false: By default, useCursorFetch is enabled, indicating that the JDBC connector communicates with relational databases using a binary protocol. Some third-party systems may have compatibility issues, causing migration time conversion errors. In this case, you can disable this function. Open-source MySQL databases support the useCursorFetch parameter, and you do not need to set this parameter.
                                                        • allowPublicKeyRetrieval=true: By default, public key retrieval is disabled for MySQL databases. If TLS is unavailable and an RSA public key is used for encryption, connection to an MySQL database may fail. In this case, you can enable public key retrieval to avoid connection failures.
                                                        • useSSL=false: Enable SSL encryption using this attribute when the CDM cluster version is 2.10.0.300 and the MySQL version is later than 5.7.43.

                                                        sslmode=require

                                                        @@ -148,7 +149,7 @@
                                                        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1212.html b/docs/dataartsstudio/umn/dataartsstudio_01_1212.html index 953190a8d..d150b7fd8 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1212.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1212.html @@ -1,6 +1,6 @@ -

                                                        Link to an Oracle Database

                                                        +

                                                        Oracle Database Link Parameters

                                                        Table 1 lists the parameters for a link to an Oracle database.

                                                        Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                                        @@ -71,14 +71,14 @@

                                                        Use Agent

                                                        Whether to extract data from the data source through an agent

                                                        +

                                                        The agent function will be unavailable soon and does not need to be configured.

                                                        Yes

                                                        +

                                                        -

                                                        Agent

                                                        Click Select and select the agent created in Managing Agents.

                                                        +

                                                        The agent function will be unavailable soon and does not need to be configured.

                                                        -

                                                        Later than 12.1

                                                        Fetch Size

                                                        -

                                                        (Optional) Displayed when you click Show Advanced Attributes.

                                                        -

                                                        Number of rows obtained by each request. Set this parameter based on the data source and the job's data size. If the value is either too large or too small, the job may run for a long time.

                                                        -

                                                        A migration from the Oracle to DWS database may time out due to a long data write duration in the DWS database. In this case, reduce the value of Fetch Size for the Oracle database.

                                                        -

                                                        1000

                                                        -

                                                        Link Attributes

                                                        -

                                                        (Optional) Click Add to add the JDBC connector attributes of multiple specified data sources. For details, see the JDBC connector document of the corresponding database.

                                                        -
                                                        The following are some examples:
                                                        • oracle.net.CONNECT_TIMEOUT=60000 and oracle.jdbc.ReadTimeout=300000: When a large amount of data needs to be migrated or the entire table is retrieved using query statements, the migration fails due to connection timeout. In this case, you can customize the connection timeout interval (ms) and read timeout interval (ms) to prevent failures caused by timeout.
                                                        -
                                                        -

                                                        sslmode=require

                                                        -

                                                        Reference Sign

                                                        +

                                                        Reference Sign

                                                        (Optional) Delimiter between the names of the referenced tables or columns. For details, see the product documentation of the corresponding database.

                                                        "

                                                        Driver Version

                                                        +

                                                        Driver Version

                                                        Different types of relational databases adapt to different drivers. For details, see How Do I Obtain a Driver?

                                                        -

                                                        Fetch Size

                                                        +

                                                        (Optional) Displayed when you click Show Advanced Attributes.

                                                        +

                                                        Number of rows obtained by each request. Set this parameter based on the data source and the job's data size. If the value is either too large or too small, the job may run for a long time.

                                                        +

                                                        A migration from the Oracle to DWS database may time out due to a long data write duration in the DWS database. In this case, reduce the value of Fetch Size for the Oracle database.

                                                        +

                                                        1000

                                                        +

                                                        Commit Size

                                                        +

                                                        (Optional) Displayed when you click Show Advanced Attributes.

                                                        +

                                                        Number of rows submitted in a batch

                                                        +

                                                        10000

                                                        +

                                                        Link Attributes

                                                        +

                                                        This parameter is optional. You can click Add to add custom attributes for the link.

                                                        +

                                                        The following are some examples:

                                                        +
                                                        • oracle.net.CONNECT_TIMEOUT: connection timeout, in milliseconds. The default value is 60000.
                                                        • oracle.jdbc.ReadTimeout: socket read timeout, in milliseconds. The default value is 300000.
                                                        +

                                                        60000

                                                        +

                                                        Link Secret Attributes

                                                        +

                                                        (Optional) Displayed when you click Show Advanced Attributes.

                                                        +

                                                        Custom secret attributes of the link

                                                        +

                                                        sk=09fUgD5WOF1L6f

                                                        +
                                                        @@ -129,7 +145,7 @@
                                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1214.html b/docs/dataartsstudio/umn/dataartsstudio_01_1214.html index 884e8562f..631f79992 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1214.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1214.html @@ -1,6 +1,6 @@ -

                                                      Link to a Database Shard

                                                      +

                                                      Shard Link Parameters

                                                      Sharding refers to the link to multiple backend data sources at the same time. The link can be used as the job source to migrate data from multiple data sources to other data sources. Table 1 lists the link parameters.

                                                      Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                                      @@ -37,14 +37,14 @@

                                                      Use Agent

                                                      Whether to extract data from the data source through an agent

                                                      +

                                                      The agent function will be unavailable soon and does not need to be configured.

                                                      Yes

                                                      +

                                                      -

                                                      Agent

                                                      Click Select and select the agent created in Managing Agents.

                                                      +

                                                      The agent function will be unavailable soon and does not need to be configured.

                                                      -

                                                      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                                      Table 1 Doris link parameters

                                                      Parameter

                                                      -

                                                      Description

                                                      -

                                                      Example Value

                                                      -

                                                      Name

                                                      -

                                                      Link name, which should be defined based on the data source type, so it is easier to remember what the link is for

                                                      -

                                                      Doris_link

                                                      -

                                                      Database Server

                                                      -

                                                      One or more server lists (server domain names/IP addresses) separated by semicolons (;)

                                                      -
                                                      NOTE:
                                                      • For the open-source Doris, enter the server domain names or IP addresses.
                                                      • For MRS Doris, log in to Manager of the cluster where the MRS Doris data source is located, choose Cluster > Services > Doris > Instance, and view the MRS Doris service IP address.
                                                      -
                                                      -

                                                      192.168.0.1;192.168.0.2

                                                      -

                                                      Port

                                                      -

                                                      Port of the database to connect

                                                      -
                                                      NOTE:
                                                      • For the open-source Doris, enter the server domain names or IP addresses.
                                                      • For MRS Doris, log in to Manager of the cluster where the MRS Doris data source is located, choose Cluster > Services > Doris > Configurations > Basic Configurations, and view the MRS Doris service IP address.

                                                        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                        -
                                                      -
                                                      -

                                                      9030

                                                      -

                                                      Database Name

                                                      -

                                                      Name of the database to connect

                                                      -

                                                      dbname

                                                      -

                                                      Username

                                                      -

                                                      Username used for accessing the database This account must have the permissions required to read and write data tables and metadata.

                                                      -

                                                      cdm

                                                      -

                                                      Password

                                                      -

                                                      Password of the user

                                                      -

                                                      -

                                                      -

                                                      Use Agent

                                                      -

                                                      Whether to extract data from the data source through an agent

                                                      -

                                                      Yes

                                                      -

                                                      Agent

                                                      -

                                                      Click Select and select the agent created in Managing Agents.

                                                      -

                                                      -

                                                      -

                                                      Fetch Size

                                                      -

                                                      (Optional) Displayed when you click Show Advanced Attributes.

                                                      -

                                                      Number of rows obtained by each request. Set this parameter based on the data source and the job's data size. If the value is either too large or too small, the job may run for a long time.

                                                      -

                                                      1000

                                                      -

                                                      Commit Size

                                                      -

                                                      (Optional) Displayed when you click Show Advanced Attributes.

                                                      -

                                                      Number of records submitted each time. Set this parameter based on the data destination and the job's data size. If the value is either too large or too small, the job may run for a long time.

                                                      -

                                                      -

                                                      -

                                                      Link Attributes

                                                      -

                                                      (Optional) Click Add to add the JDBC connector attributes of multiple specified data sources. For details, see the JDBC connector document of the corresponding database.

                                                      -

                                                      The following are some examples:

                                                      -

                                                      connectTimeout=600000 and socketTimeout=300000: When a large amount of data needs to be migrated or the entire table is retrieved using query statements, the migration fails due to connection timeout. In this case, you can customize the connection timeout interval (ms) and socket timeout interval (ms) to prevent failures caused by timeout.

                                                      -

                                                      sslmode=require

                                                      -

                                                      Reference Sign

                                                      -

                                                      (Optional) Delimiter between the names of the referenced tables or columns. For details, see the product documentation of the corresponding database.

                                                      -

                                                      `

                                                      -
                                                      -
                                                      -
                                                    -
                                                    - -
                                                    - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1251.html b/docs/dataartsstudio/umn/dataartsstudio_01_1251.html index 636493e13..0013df60a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1251.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1251.html @@ -33,7 +33,7 @@

                                                    Name of the table to which data will be written. Click the icon next to the text box. The dialog box for selecting the table is displayed.

                                                    This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                    -
                                                    NOTE:

                                                    If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                    +
                                                    NOTE:

                                                    If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                    table

                                                    @@ -89,10 +89,10 @@

                                                    Extending field length

                                                    When Auto creation is selected, the length of the character fields can be extended to three times the original length and then written to the destination table. If the encoding types of the source and destination databases are different, but the character fields in the source and destination tables are the same, errors may occur during data migration due to character length difference.

                                                    -

                                                    When a character field containing Chinese characters is imported to DWS, the length of the character field must be automatically increased by three times.

                                                    +

                                                    When Auto creation is selected, the length of the character fields can be extended to four times the original length and then written to the destination table. If the encoding types of the source and destination databases are different, but the character fields in the source and destination tables are the same, errors may occur during data migration due to character length difference.

                                                    +

                                                    When a character field containing Chinese characters is imported to DWS, the length of the character field must be automatically increased by four times.

                                                    If a job fails to be executed and an error message similar to value too long for type character varying exists in the log when you import Chinese characters to DWS, you can enable this function to solve the problem.

                                                    -
                                                    NOTE:

                                                    When this function is enabled, some fields consume three times the storage space of the user.

                                                    +
                                                    NOTE:

                                                    When this function is enabled, some fields consume four times the storage space of the user.

                                                    No

                                                    @@ -130,7 +130,7 @@

                                                    Field Mapping in Automatic Table Creation on DWS

                                                    Figure 1 describes the field mapping between DWS tables created by CDM and source tables. For example, if you use CDM to migrate the Oracle database to DWS, CDM automatically creates a table on DWS and maps the NUMBER(3,0) field of the Oracle database to the SMALLINT field of DWS.

                                                    -
                                                    Figure 1 Field mapping in automatic table creation
                                                    +
                                                    Figure 1 Field mapping in automatic table creation

                                                    Indexes cannot be created in automatic table creation scenarios.

                                                    @@ -138,7 +138,14 @@
                                                    + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1254.html b/docs/dataartsstudio/umn/dataartsstudio_01_1254.html index 0e7b169ed..441636f75 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1254.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1254.html @@ -21,8 +21,8 @@

                                                SQL Statement

                                                When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

                                                -
                                                NOTE:
                                                • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                                • With statements are not supported.
                                                • Comments, such as -- and /*, are not supported.
                                                • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                                  • load data
                                                  • delete from
                                                  • alter table
                                                  • create table
                                                  • drop table
                                                  • into outfile
                                                  -
                                                +
                                                NOTE:
                                                • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                                • With statements are not supported.
                                                • Comments, such as -- and /*, are not supported.
                                                • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                                  • load data
                                                  • delete from
                                                  • alter table
                                                  • create table
                                                  • drop table
                                                  • into outfile
                                                  +
                                                • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

                                                select id,name from sqoop.user;

                                                @@ -43,7 +43,7 @@

                                                If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                                This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                This parameter can be set to a regular expression to export all databases that meet the rule. For example, if Table Name is set to user_[0-9]{1,2}, tables from user_0 to user_9 and from user_00 to user_99 are matched.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                +
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                table

                                                @@ -63,12 +63,19 @@

                                                WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

                                                You can set a date macro variable to extract data generated on a specific date.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                +
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                                Retain One Decimal Place for Date Values

                                                +

                                                Whether to retain one decimal place for date values

                                                +

                                                Yes

                                                +

                                                Null in Partition Column

                                                Whether the partition column can contain null values

                                                @@ -127,7 +134,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1255.html b/docs/dataartsstudio/umn/dataartsstudio_01_1255.html index 527487e1c..29bdf7a6f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1255.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1255.html @@ -21,8 +21,8 @@

                                                SQL Statement

                                                When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

                                                -
                                                NOTE:
                                                • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                                • With statements are not supported.
                                                • Comments, such as -- and /*, are not supported.
                                                • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                                  • load data
                                                  • delete from
                                                  • alter table
                                                  • create table
                                                  • drop table
                                                  • into outfile
                                                  -
                                                +
                                                NOTE:
                                                • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                                • With statements are not supported.
                                                • Comments, such as -- and /*, are not supported.
                                                • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                                  • load data
                                                  • delete from
                                                  • alter table
                                                  • create table
                                                  • drop table
                                                  • into outfile
                                                  +
                                                • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.

                                                select id,name from sqoop.user;

                                                @@ -44,7 +44,7 @@

                                                Name of the table from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting the table or directly enter a table name.

                                                If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                                This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                +
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                NOTE:
                                                The table name can contain wildcard characters (*), which is used to export all tables whose names start with a certain prefix or end with a certain suffix. The number and types of fields in the tables must be the same. The examples are as follows:
                                                • table* indicates that all tables whose names starting with table are exported.
                                                • *table indicates that all tables whose names ending with table are exported.
                                                • *table* indicates that all tables whose names containing table are exported.
                                                @@ -67,7 +67,7 @@

                                                WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

                                                You can set a date macro variable to extract data generated on a specific date.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                +
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                                @@ -141,7 +141,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1256.html b/docs/dataartsstudio/umn/dataartsstudio_01_1256.html index 46be1d201..e207a2bf2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1256.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1256.html @@ -30,7 +30,7 @@

                                                If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                                This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                This parameter can be set to a regular expression to export all databases that meet the rule.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                +
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                table

                                                @@ -42,7 +42,7 @@

                                                Specifies the data extraction range. If this parameter is not set, the entire table is extracted.

                                                You can set a date macro variable to extract data generated on a specific date.

                                                -
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                +
                                                NOTE:

                                                If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                                @@ -57,7 +57,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1280.html b/docs/dataartsstudio/umn/dataartsstudio_01_1280.html index 0ae6e07da..07969c7bb 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1280.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1280.html @@ -4,7 +4,7 @@

                                                This section describes how to configure the maximum number of job nodes that can run concurrently in a workspace.

                                                Constraints

                                                The number of concurrently running nodes in the workspace cannot exceed that in the instance.

                                                -

                                                Procedure

                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                3. In the navigation pane, choose Configuration > Configure.
                                                4. Choose Nodes Concurrently Running.
                                                5. Set Nodes Concurrently Running in the Workspace. Ensure that the value is less than or equal to the maximum number of nodes that can run concurrently in the DataArts Studio instance.

                                                  Table 1 lists the maximum number of nodes that can run concurrently in the DataArts Studio instance. To view the quota of the job node scheduling times per day, click More of a DataArts Studio instance and select Quota Usage.

                                                  +

                                                  Procedure

                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                  3. In the navigation pane, choose Configuration > Configure.
                                                  4. Choose Nodes Concurrently Running.
                                                  5. Set Nodes Concurrently Running in the Workspace. Ensure that the value is less than or equal to the maximum number of nodes that can run concurrently in the DataArts Studio instance.

                                                    Table 1 lists the maximum number of nodes that can run concurrently in the DataArts Studio instance. To view the quota of the job node scheduling times per day, click More of a DataArts Studio instance and select Quota Usage.

                                                    @@ -45,7 +45,7 @@
                                                    Table 1 Maximum number of nodes that can run concurrently in a DataArts Studio instance

                                                    Job Node Scheduling Times/Day of a DataArts Studio Instance

                                                    -
                                                    Figure 1 Configuring the number of concurrently running nodes
                                                    +
                                                    Figure 1 Configuring the number of concurrently running nodes

                                                  6. Click Save.
                                                  @@ -60,3 +60,10 @@
                                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1282.html b/docs/dataartsstudio/umn/dataartsstudio_01_1282.html index 01149ba86..6d1544289 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1282.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1282.html @@ -1,15 +1,15 @@

                                                Configuring a Template

                                                -

                                                This section describes how to create and use a Flink SQL template. When writing Flink SQL code, you can use an SQL template for repeated service logic. In addition, you can use a job parameter template when configuring job parameters.

                                                +

                                                This section describes how to create and use a template. When writing code, you can use an SQL template for repeated service logic. In addition, you can use a job parameter template when configuring job parameters.

                                                Constraints

                                                This function applies to the following scenarios:

                                                -
                                                • Use a script template for a Flink SQL script.
                                                • During pipeline job development, use a Fink SQL script which uses a script template for the MRS Flink Job node and use a parameter template for Program Parameter of the MRS Flink Job node.
                                                • Use a script template in a single-task Flink SQL job.
                                                • Use template parameters in a single-task Flink JAR job.
                                                +
                                                • Use a script template for a Flink SQL script.
                                                • During pipeline job development, use a Fink SQL script which uses a script template for the MRS Flink Job node and use a parameter template for Program Parameter of the MRS Flink Job node.
                                                • Use a script template in a single-task Flink SQL job.
                                                • Use template parameters in a single-task Flink JAR job.
                                                • You can use parameter templates for Spark SQL and Hive SQL scripts and single-task jobs. For details about how to use a template, see Configuring a Default Item.
                                                -

                                                Procedure

                                                1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                2. In the navigation pane, choose Configuration > Configure.
                                                3. Choose Templates.

                                                  • Create a script template.
                                                    1. On the Script Templates page, click Add.
                                                    2. Set Template Name.
                                                    3. Enter an SQL statement and reference script parameters.
                                                    4. Configure the script template parameters. The parameter names cannot be changed, and the parameter values can be changed.
                                                      Figure 1 Creating a script template
                                                      +

                                                      Procedure

                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                      3. In the navigation pane, choose Configuration > Configure.
                                                      4. Choose Templates.

                                                        • Create a script template.
                                                          1. On the Script Templates page, click Add.
                                                          2. Set Template Name.
                                                          3. Enter an SQL statement and reference script parameters.
                                                          4. Configure the script template parameters. The parameter names cannot be changed, and the parameter values can be changed.
                                                            Figure 1 Creating a script template

                                                          5. Click Save.

                                                            You can view, modify, or delete the created script template.

                                                          -
                                                        • Create a parameter template.
                                                          1. On the Parameter Templates page, click Add.
                                                          2. Set Template Name.
                                                          3. Click Add Parameter and set parameter names and values. You can modify or delete parameters.
                                                            Figure 2 Creating a parameter template
                                                            +
                                                          4. Create a parameter template.
                                                            1. On the Parameter Templates page, click Add.
                                                            2. Set Template Name.
                                                            3. Click Add Parameter Set parameter names and values. You can modify or delete parameters.

                                                            4. Click OK.

                                                              You can view, modify, or delete the created parameter template.

                                                              For details about the application scenarios of script templates and parameter templates, see Using Script Templates and Parameter Templates.

                                                              @@ -24,3 +24,10 @@
                                                + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1283.html b/docs/dataartsstudio/umn/dataartsstudio_01_1283.html index 501c78f11..4bd99a483 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1283.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1283.html @@ -1,17 +1,19 @@

                                                Configuring a Scheduling Calendar

                                                -

                                                You can configure a scheduling calendar and specify the working days for scheduling a job.

                                                +
                                                • You can configure a scheduling calendar and specify the working days for scheduling a job.
                                                • After creating a scheduling calendar, you can go to the DataArts Factory console, open a job, click Scheduling Setup, select Run periodically for Scheduling Type, and select the calendar you have created for Scheduling Calendar. A dry run is performed beyond the calendar, and the job is executed normally within the calendar range.

                                                  If the scheduling calendar function is used, the system checks whether the planned execution time of a job instance is a working day during data job scheduling or patching.

                                                  +
                                                  • If the planned execution time of the instance is a working day in the calendar, the instance is executed normally.
                                                  • If the planned execution time of the instance is not a working day in the calendar, a dry run is performed.
                                                  +
                                                  +

                                                Constraints

                                                This function is available for batch processing jobs but not for real-time processing jobs.

                                                -

                                                Procedure

                                                1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                2. In the left navigation pane, choose Configuration > Configure.
                                                3. Choose Scheduling Calendars.
                                                4. Click Add. The Create Scheduling Calendar dialog box is displayed.

                                                  Figure 1 Create Scheduling Calendar dialog box
                                                  -

                                                  -

                                                5. Set parameters for the scheduling calendar.

                                                  Set Calendar Name, Owner, Default Working Days, and Description.

                                                  +

                                                  Procedure

                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                  3. In the left navigation pane, choose Configuration > Configure.
                                                  4. Choose Scheduling Calendars.
                                                  5. Click Add. The Create Scheduling Calendar dialog box is displayed.

                                                    Figure 1 Create Scheduling Calendar dialog box
                                                    +

                                                  6. Set parameters for the scheduling calendar.

                                                    Set Calendar Name, Default Working Days, and Description.

                                                    You can select Mon to Fri or Mon to Sun for Default Working Days. By default, Mon to Fri is selected.

                                                    -

                                                  7. Click OK.

                                                    After creating the calendar, you can use it for jobs. Go to the DataArts Factory console, open a job, click Scheduling Setup, select Run periodically for Scheduling Type, and select the calendar you have created for Scheduling Calendar.

                                                    +

                                                  8. Click OK.

                                                    After creating the calendar, you can use it for jobs. Go to the DataArts Factory console, open a job, click Scheduling Setup, select Run periodically for Scheduling Type, and select the calendar you have created for Scheduling Calendar. A dry run is performed beyond the calendar, and the job is executed normally within the calendar range.

                                                  -

                                                  More Operations

                                                  • Modify a calendar: Click Modify in the Operation column.
                                                    • Batch Select: Select all Mondays to Fridays of the current month.
                                                    • Invert Selection: Select all non-working days.
                                                    • Clear: Clear selected working days.
                                                      Figure 2 Modifying a scheduling calendar
                                                      +

                                                      More Operations

                                                      • Modify a calendar: Click Modify in the Operation column.
                                                        • Batch Select: Select all Mondays to Fridays of the current month.
                                                        • Invert Selection: Select all non-working days.
                                                        • Clear: Clear selected working days.
                                                          Figure 2 Modifying a scheduling calendar

                                                      • Delete a calendar: Click Delete in the Operation column.
                                                      @@ -23,3 +25,10 @@
                                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1284.html b/docs/dataartsstudio/umn/dataartsstudio_01_1284.html index 21dbb3438..66f5d746e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1284.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1284.html @@ -2,35 +2,31 @@

                                                  Configuring Task Groups

                                                  By configuring a task group, you can control the maximum number of concurrent nodes in a task group in a more fine-grained manner.

                                                  -

                                                  Constraints

                                                  This function is available only for batch processing jobs.

                                                  -

                                                  Task groups cannot be used across workspaces.

                                                  +

                                                  Constraints

                                                  • This function is available only for batch processing jobs.
                                                  • Task groups cannot be used across workspaces.
                                                  • For a pipeline job, you can configure a task group for each node or for the job. A task group configured for a node is prior to one configured for the job.
                                                  -

                                                  Procedure

                                                  1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                  2. In the left navigation pane, choose Configuration > Configure.
                                                  3. Choose Task Groups.
                                                  4. Click Create.
                                                  5. In the displayed dialog box, set required parameters.

                                                    -

                                                    Table 1 Parameters for creating a task group

                                                    Parameter

                                                    +

                                                    Procedure

                                                    1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                    2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                    3. In the left navigation pane, choose Configuration > Configure.
                                                    4. Choose Task Groups.
                                                    5. Click Create.
                                                    6. In the displayed dialog box, set required parameters.

                                                      +

                                                      - - - - - - - - - - @@ -39,7 +35,7 @@

                                                    7. Click OK.

                                                      After the task group is created, go to the job development page. On the canvas of a job, click Scheduling Setup and select the created task group. Then the number of concurrent nodes in the current task group can be controlled in a more fine-grained manner based on the selected task group.

                                                    8. -

                                                      Follow-up Operations

                                                      Modifying a task group: Locate a task group and click Modify in the Operation column.

                                                      +

                                                      Follow-up Operations

                                                      Modifying a task group: Locate a task group and click Modify in the Operation column. The modification takes effect immediately.

                                                      Deleting a task group: Locate a task group and click Delete in the Operation column. A task group used by a job cannot be deleted.

                                                      Viewing references: Locate a task group and click View Reference in the Operation column to view the jobs that are using the task group.

                                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1299.html b/docs/dataartsstudio/umn/dataartsstudio_01_1299.html index ecf117316..bbf34f66f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1299.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1299.html @@ -1,21 +1,23 @@ -

                                                      Creating a Data Connection

                                                      +

                                                      Creating a DataArts Studio Data Connection

                                                      You can create data connections by configuring data sources. Based on the data connections of the Management Center, DataArts Studio performs data development, governance, services, and operations on the data lake base.

                                                      After the data connection between the development environment and production environment is configured, the data connection in the development environment in the script or job during data development is automatically switched to the data connection in the production environment after the process is released.

                                                      -

                                                      Constraints

                                                      • RDS data connections depend on OBS. If OBS is unavailable in the same region as DataArts Studio, RDS data connections are not supported.
                                                      • For host connections, only Linux hosts are supported.
                                                      • If changes occur in the connected data lake (for example, the MRS cluster capacity is expanded), you need to edit and save the connection.
                                                      • If the data lake authentication information in a data connection changes (for example, the password expires), the data connection becomes invalid. Ensure that the data lake authentication information is permanently valid to prevent any loss caused by connection failures.
                                                      -
                                                      -

                                                      Prerequisites

                                                      • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                        • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                        • Before creating an MRS connection such as an MRS HBase and MRS Hive connection, ensure that you have created an MRS cluster and selected required components.
                                                        -
                                                      • The data lake to connect communicates with the DataArts Studio instance properly.
                                                        • If the data lake is an on-premises database, a public network or a dedicated connection is required. Ensure that the host where the data source is located can access the public network and the port has been enabled in the firewall rule.
                                                        • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                          • If the CDM cluster in the DataArts Studio instance and the cloud service are in different regions, a public network or a dedicated connection is required.
                                                          • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                          • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                          +

                                                          Constraints

                                                          • RDS data connections depend on OBS. If OBS is unavailable in the same region as DataArts Studio, RDS data connections are not supported.
                                                          • For host connections, only Linux hosts are supported.
                                                          • If changes occur in the connected data lake (for example, the MRS cluster capacity is expanded), you need to edit and save the connection.
                                                          • If the data lake authentication information in a data connection changes (for example, the password expires), the data connection becomes invalid. Ensure that the data lake authentication information is permanently valid to prevent any loss caused by connection failures.
                                                          • DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                            +
                                                          • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                          -
                                                        • If the enterprise mode is used, pay attention to the following points:
                                                          In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                          • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a Data Connection.
                                                          • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                          • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                          +
                                                          +

                                                          Prerequisites

                                                          • You have created a data lake to connect, for example, a database or cloud service supported by DataArts Studio.
                                                            • Before creating a DWS data connection, ensure that you have created a cluster in DWS and have the permissions required to view Key Management Service (KMS) keys.
                                                            • Before creating an MRS connection such as an MRS HBase or MRS Hive connection, ensure that you have created an MRS cluster whose Kerberos encryption type is aes256-sha1,aes128-sha1, and that the cluster contains required components.
                                                            +
                                                          • You have obtained the required agent (CDM cluster). If no CDM cluster is available, create one by referring to Creating a CDM Cluster. The CDM cluster can communicate with the data lake to be connected.
                                                            • If the data lake is an on-premises database, you need the Internet or Direct Connect. Ensure that the host where the data source is located and the CDM cluster can access the Internet, and the connection port has been enabled in the firewall rule.
                                                            • If the data lake is a cloud service (such as DWS and MRS), the following requirements must be met for network interconnection:
                                                              • If the CDM cluster and the cloud service are in different regions, a public network or a dedicated connection is required for enabling communication between the CDM cluster and the cloud service.
                                                              • If the CDM cluster and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                              • The cloud service instance and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                              +
                                                            +
                                                          • If the enterprise mode is used, pay attention to the following points:
                                                            In enterprise mode, the development environment and production environment need to be distinguished. Therefore, you need to prepare two sets of data lake services for the production environment and development environment to isolate the development environment from the production environment.
                                                            • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a DataArts Studio Data Connection.
                                                            • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                            • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                            • Offline processing migration jobs are not supported in enterprise mode.

                                                            For example, if your data lake service is an MRS cluster, you need to prepare two MRS clusters with the same version, specifications, components, region, VPC, and subnet. If some configurations of an MRS cluster are modified, you also need to synchronize the modifications to the other MRS cluster.

                                                          -

                                                          Creating a Data Connection

                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                          2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                          3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                            Figure 1 Creating a data connection
                                                            +

                                                            Creating a Data Connection

                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                            2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                            3. On the displayed Manage Data Connections page, click Create Data Connection.

                                                              Figure 1 Creating a data connection

                                                              -

                                                            4. On the displayed page, select a data connection type and configure the parameters listed in Table 1.

                                                              • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a Data Connection.
                                                              • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                              • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                              +

                                                            5. On the displayed page, select a data connection type and configure the parameters listed in Table 1.

                                                              • If two clusters are used for clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services. The versions, specifications, components, regions, VPCs, subnets, and related configurations of the two sets of data lake services must be the same. For details on how to create data connections, see Creating a DataArts Studio Data Connection.
                                                              • For serverless services (such as DLI), DataArts Studio configures the mapping between data lake services in the production environment and development environment through environment isolation in the management center. The corresponding data lake is automatically switched during the development and production processes. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                              • For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments. For details, see DB configuration.
                                                              • Offline processing migration jobs are not supported in enterprise mode.
                                                      Table 1 Parameters for creating a task group

                                                      Parameter

                                                      Description

                                                      +

                                                      Description

                                                      Task Group Name

                                                      +

                                                      Task Group Name

                                                      Name of the task group

                                                      +

                                                      Name of the task group. It must be unique.

                                                      Owner

                                                      +

                                                      Maximum number of concurrency

                                                      Owner of the task group

                                                      +

                                                      Maximum number of concurrent job nodes in the current task group

                                                      +

                                                      The maximum number of concurrent nodes is the current number of concurrent DataArts Studio instances.

                                                      +

                                                      The value cannot exceed the maximum number of concurrent nodes of the DataArts Studio instance, which is 1,000.

                                                      +

                                                      The maximum number of concurrent nodes varies depending on the DataArts Studio instance specifications.

                                                      Maximum number of concurrency

                                                      +

                                                      Description

                                                      Maximum number of concurrent job nodes in the current task group

                                                      -

                                                      The maximum number of concurrent nodes is the current number of concurrent DataArts Studio instances.

                                                      -

                                                      Description

                                                      -

                                                      Description of the task group

                                                      +

                                                      Description of the task group

                                                      - - - - - - - - - - - + + + - - - - + + + + + + + + + @@ -102,7 +124,7 @@

                                                      Related Operations

                                                      • Edit a data connection: In the data connection list, locate a connection and click Edit in the Operation column. On the displayed page, modify the parameters listed in Table 1 as needed.

                                                        If you do not want to change the password, you do not need to set it. The system automatically uses the password set when the connection was created.

                                                        -

                                                        Click Test to check whether the data connection is normal. If the connection is normal, click Save. If the connection is abnormal, the data connection cannot be created. Modify the connection parameters as prompted and try again.

                                                        +

                                                        Click Test to check whether the data connection is normal. If the connection is normal, click Save. If the connection is abnormal, the data connection cannot be created. Modify the connection parameters as prompted and try again.

                                                      • Delete a data connection: In the data connection list, locate a connection and click Delete in the Operation column. In the displayed dialog box, confirm the data connection information, and click OK.
                                                        If the connection to be deleted is being used, it cannot be deleted directly. In this case, you need to stop the connection from being used on the console of each component and try again.

                                                        If a data connection is deleted, the data table information of the data connection will also be deleted. Exercise caution when performing this operation.

                                                        @@ -111,7 +133,14 @@
                                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1300.html b/docs/dataartsstudio/umn/dataartsstudio_01_1300.html index 6e6ab3f24..8b366f93d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1300.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1300.html @@ -1,6 +1,6 @@ -

                                                      Configuring a DWS Connection

                                                      +

                                                      DWS Connection Parameters

                                                      Table 1 Data connection parameters

                                                      Data Connection Type

                                                      @@ -24,75 +26,95 @@

                                                      DWS

                                                      +

                                                      GaussDB(DWS)

                                                      See Configuring a DWS Connection.

                                                      +

                                                      See DWS Connection Parameters.

                                                      DLI

                                                      See Configuring a DLI Connection.

                                                      +

                                                      See DLI Connection Parameters.

                                                      MRS Hive

                                                      See Configuring an MRS Hive Connection.

                                                      +

                                                      See MRS Hive Connection Parameters.

                                                      MRS HBase

                                                      See Configuring an MRS HBase Connection.

                                                      +

                                                      See MRS HBase Connection Parameters.

                                                      MRS Kafka

                                                      See Configuring an MRS Kafka Connection.

                                                      +

                                                      See MRS Kafka Connection Parameters.

                                                      MRS Spark

                                                      See Configuring an MRS Spark Connection.

                                                      +

                                                      See MRS Spark Connection Parameters.

                                                      MRS ClickHouse

                                                      See Configuring an MRS ClickHouse Connection.

                                                      +

                                                      See MRS ClickHouse Connection Parameters.

                                                      MRS Hetu

                                                      See Configuring an MRS Hetu Connection.

                                                      +

                                                      See MRS Hetu Connection Parameters.

                                                      MRS Impala

                                                      See Configuring an MRS Impala Connection.

                                                      +

                                                      See MRS Impala Connection Parameters.

                                                      MRS Doris

                                                      See Configuring an MRS Doris Connection.

                                                      +

                                                      See Doris Connection Parameters.

                                                      +

                                                      OpenSource ClickHouse

                                                      +

                                                      See OpenSource ClickHouse Connection Parameters.

                                                      RDS

                                                      See Configuring an RDS Connection.

                                                      +

                                                      See RDS Connection Parameters.

                                                      The RDS connection can connect to relational databases such as RDS for MySQL, PostgreSQL, DM, SQL Server, and SAP HANA.

                                                      MySQL (pending offline)

                                                      You are not advised to select this connection type. Instead, You are advised to select RDS. For details, see Configuring an RDS Connection.

                                                      +

                                                      You are not advised to select this connection type. Instead, You are advised to select RDS. For details, see RDS Connection Parameters.

                                                      Oracle

                                                      See Configuring an Oracle Connection.

                                                      +

                                                      See Oracle Connection Parameters.

                                                      Host Connection

                                                      See Configuring a Host Connection.

                                                      +

                                                      See Host Connection Parameters.

                                                      +

                                                      Rest Client

                                                      +

                                                      See Rest Client Connection Parameters.

                                                      +

                                                      Redis

                                                      +

                                                      See Redis Connection Parameters.

                                                      +

                                                      SAP HANA

                                                      +

                                                      See SAP HANA Connection Parameters.

                                                      @@ -38,7 +38,6 @@ - @@ -88,15 +91,17 @@ - - @@ -124,7 +129,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1301.html b/docs/dataartsstudio/umn/dataartsstudio_01_1301.html index bc0e6fc2d..17c9de8f2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1301.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1301.html @@ -1,6 +1,6 @@ -

                                                      Configuring a DLI Connection

                                                      +

                                                      DLI Connection Parameters

                                                      Table 1 DWS connection

                                                      Parameter

                                                      Yes

                                                      Select the modules for which this connection is available.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      Basic and Network Connectivity Configuration

                                                      @@ -48,7 +47,8 @@

                                                      Yes

                                                      DWS supports SSL encryption and certificate authentication for communication between the client and server. You can use SSL Connection to set the communication mode. If SSL Connection is enabled, only SSL encryption can be used. If SSL Connection is disabled, both modes can be used. This function is disabled by default.

                                                      +
                                                      DWS supports SSL encryption and certificate authentication for communication between the client and server. You can set this parameter based on whether SSL connection is mandatory on the server.
                                                      • If this parameter is enabled, only SSL encryption can be used for communication.
                                                      • If this parameter is disabled, both SSL encryption and certificate authentication can be used for communication.
                                                      +

                                                      Manual

                                                      @@ -57,6 +57,8 @@

                                                      Select either of the following modes:

                                                      • Cluster Name Mode: Select an existing cluster.
                                                      • Connection String Mode: Enter the IP address/domain name and port of the corresponding cluster and enable the communication between the connection's agent (CDM cluster) and the DWS cluster.
                                                      +
                                                      NOTE:

                                                      DataArts Security does not support GaussDB(DWS) connections in connection string mode.

                                                      +

                                                      DWS Cluster Name

                                                      @@ -72,6 +74,7 @@

                                                      Yes

                                                      This parameter is mandatory when Manual is set to Connection String Mode.

                                                      +

                                                      If you choose to manually enter an IP address or domain name, you must enter an internal IP address and a port that is accessible to the network segment of the resource group. Otherwise, the network is disconnected.

                                                      This parameter indicates the address for accessing the cluster database through an internal network. Enter an IP address or domain name. The IP address or domain name is automatically generated during cluster creation. You can obtain them on the management console by performing the following operations:
                                                      1. Log in to the GaussDB(DWS) console.
                                                      2. In the left navigation pane, choose Instances.
                                                      3. Click the name of an instance to enter the basic information page. In the Connection Information area, you can obtain the private IP address, domain name, and port number.

                                                      Yes

                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                      +
                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                      NOTE:
                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                      +
                                                      +

                                                      Agent

                                                      Yes

                                                      Data Warehouse Service (DWS) is not a fully managed service and thus cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating a DWS data connection. If no CDM cluster is available, create one first.

                                                      -

                                                      As a network proxy, the CDM cluster must be able to communicate with the DWS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the DWS cluster. The security group rule must also allow the CDM cluster communicate with the DWS cluster.

                                                      +

                                                      Data Warehouse Service (DWS) is not a fully managed service and thus cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating a DWS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                      +

                                                      As a network proxy, the CDM cluster must be able to communicate with the DWS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the DWS cluster. The security group rule must also allow the CDM cluster communicate with the DWS cluster.

                                                      NOTE:

                                                      If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                      @@ -38,7 +38,19 @@ + + + + + + @@ -47,7 +59,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1302.html b/docs/dataartsstudio/umn/dataartsstudio_01_1302.html index cb285364e..8b3c87874 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1302.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1302.html @@ -1,6 +1,6 @@ -

                                                      Configuring an Oracle Connection

                                                      +

                                                      Oracle Connection Parameters

                                                      Table 1 DLI connection

                                                      Parameter

                                                      Yes

                                                      Select the modules for which this connection is available.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      +

                                                      Basic and Network Connectivity Configuration

                                                      +

                                                      Project ID

                                                      +

                                                      No

                                                      +

                                                      This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                                      +

                                                      Project ID in the region where DLI resides

                                                      +
                                                      A project is a group of tenant resources, and an account ID corresponds to the current account. The IAM ID corresponds to the current user. You can view the project IDs, account IDs, and user IDs in different regions on the corresponding pages.
                                                      1. Register with and log in to the management console.
                                                      2. Hover the cursor on the username in the upper right corner and select My Credentials from the drop-down list.
                                                      3. On the API Credentials page, obtain the account name, account ID, IAM username, and IAM user ID, and obtain the project and its ID from the project list.
                                                      +
                                                      @@ -38,7 +38,6 @@ - - -
                                                      Table 1 Oracle connection

                                                      Parameter

                                                      Yes

                                                      Select the modules for which this connection is available.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      Basic and Network Connectivity Configuration

                                                      @@ -62,17 +61,17 @@

                                                      Yes

                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                      +
                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                      NOTE:
                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                      +
                                                      +

                                                      Agent

                                                      Yes

                                                      Oracle is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an Oracle data connection. If no CDM cluster is available, create one through the DataArts Migration incremental package.

                                                      +

                                                      DataArts Studio cannot be directly connected to non-fully managed services. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an Oracle data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                      As a network proxy, the CDM cluster must be able to communicate with Oracle.

                                                      -
                                                      NOTE:

                                                      If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                      -

                                                      Data Source Authentication and Other Function Configuration

                                                      @@ -133,7 +132,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1303.html b/docs/dataartsstudio/umn/dataartsstudio_01_1303.html index c2b0cb964..c1175a933 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1303.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1303.html @@ -1,7 +1,7 @@ -

                                                      Configuring an RDS Connection

                                                      -

                                                      You can create connections to RDS databases including MySQL, PostgreSQL, SQL Server, SAP HANA, and DM databases.

                                                      +

                                                      RDS Connection Parameters

                                                      +

                                                      RDS connections can be used to connect to MySQL, PostgreSQL, and SQL Server databases.

                                                      @@ -39,7 +39,6 @@ - @@ -67,27 +67,36 @@ - - - + + + + @@ -99,12 +108,19 @@
                                                      • com.mysql.jdbc.Driver: Select this driver name for RDS for MySQL or MySQL.
                                                      • org.postgresql.Driver: Select this driver name for RDS for PostgreSQL or PostgreSQL.
                                                      • com.microsoft.sqlserver.jdbc.SQLServerDriver: Select this driver name for RDS for SQL Server.
                                                      • com.huawei.opengauss.jdbc.Driver: Select this driver name for RDS for GaussDB.
                                                      + + + + @@ -132,7 +148,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1305.html b/docs/dataartsstudio/umn/dataartsstudio_01_1305.html index ed31f30ab..5c2431920 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1305.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1305.html @@ -1,6 +1,6 @@ -

                                                      Configuring a Host Connection

                                                      +

                                                      Host Connection Parameters

                                                      Table 1 RDS connection

                                                      Parameter

                                                      Yes

                                                      Select the modules for which this connection is available.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      Basic and Network Connectivity Configuration

                                                      @@ -49,7 +48,8 @@

                                                      Yes

                                                      Address for accessing the relational database data source. The value can be an IP address or a domain name.

                                                      +

                                                      Address for accessing the relational database data source. The value can be an IP address or a domain name.

                                                      +

                                                      If you choose to manually enter an IP address or domain name, you must enter an internal IP address and a port that is accessible to the network segment of the resource group. Otherwise, the network is disconnected.

                                                      • If the data source is RDS, you can obtain the address on the management console by performing the following operations:
                                                        1. Log in to the management console of the corresponding cloud service using the account you have obtained.
                                                        2. In the left navigation pane, choose Instances.
                                                        3. Click the name of an instance to enter the basic information page. In the Connection Information area, you can obtain the private IP address, domain name, and port number.
                                                      • If the data source is MySQL, PostgreSQL, or DM, you can obtain the access address from the database administrator.

                                                      Yes

                                                      GaussDB cluster mode. This parameter is available when Driver Name is set to com.huawei.opengauss.jdbc.Driver.

                                                      -
                                                      • Active/Standby
                                                      • Distributed
                                                      +

                                                      GaussDB cluster mode. This parameter is available when Driver Name is set to com.huawei.opengauss.jdbc.Driver.

                                                      +
                                                      • Primary/Standby
                                                      • Distributed

                                                      KMS Key

                                                      Yes

                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                      +
                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                      NOTE:
                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                      +
                                                      +

                                                      Agent

                                                      Yes

                                                      RDS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an RDS data connection. If no CDM cluster is available, create one first.

                                                      -

                                                      As a network proxy, the CDM cluster must be able to communicate with RDS. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as RDS. The security group rule must also allow the CDM cluster to communicate with RDS.

                                                      +

                                                      RDS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an RDS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                      +

                                                      As a network proxy, the CDM cluster must be able to communicate with RDS. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as RDS. The security group rule must also allow the CDM cluster to communicate with RDS.

                                                      NOTE:

                                                      If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                      SSL Encryption

                                                      +

                                                      No

                                                      +

                                                      Whether to enable SSL encrypted transmission.

                                                      +

                                                      Data Source Driver Configuration

                                                      Driver file source

                                                      +

                                                      Yes

                                                      +

                                                      Select the source of the driver file.

                                                      +

                                                      Driver File Path

                                                      Yes

                                                      It specifies the OBS path where the driver file is located. You need to download a .jar driver file from the corresponding official website and upload it to OBS.

                                                      - +
                                                      NOTE:
                                                      • The OBS path of the driver file cannot contain Chinese characters.
                                                      • To update the driver, you must restart the CDM cluster in DataArts Migration and then edit the data connection to upload the driver.
                                                      @@ -38,7 +38,6 @@ - @@ -75,7 +74,9 @@ - @@ -136,7 +137,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1306.html b/docs/dataartsstudio/umn/dataartsstudio_01_1306.html index ae7c8c752..f21ba2d22 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1306.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1306.html @@ -1,6 +1,6 @@ -

                                                      Configuring an MRS Hive Connection

                                                      +

                                                      MRS Hive Connection Parameters

                                                      Table 1 Host Connection parameters

                                                      Parameter

                                                      Yes

                                                      Select the modules for which this connection is available.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      Basic and Network Connectivity Configuration

                                                      @@ -56,9 +55,9 @@

                                                      Yes

                                                      CDM cluster used as an agent.

                                                      +

                                                      CDM cluster used as an agent. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                      NOTE:
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                        -
                                                      • When scheduling shell or Python scripts, the agent accesses the ECS. If shell and Python scripts are scheduled frequently, the ECS adds the private IP address of the agent to the blocklist. To ensure normal job scheduling, you are advised to use the root user of the ECS to add the private IP address bound to the agent (CDM cluster) to the /etc/hosts.allow file.

                                                        For details about how to obtain the private IP address of the CDM cluster, see Viewing Basic Cluster Information and Modifying Cluster Configurations.

                                                        +
                                                      • When scheduling shell or Python scripts, the agent accesses the ECS. If shell and Python scripts are scheduled frequently, the ECS adds the private IP address of the agent to the blocklist. To ensure normal job scheduling, you are advised to use the root user of the ECS to add the private IP address bound to the agent (CDM cluster) to the /etc/hosts.allow file.

                                                        For details about how to obtain the private IP address of the CDM cluster, see Viewing and Modifying CDM Cluster Configurations.

                                                      Yes

                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                      +
                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                      NOTE:
                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                      +
                                                      +

                                                      Data Source Authentication and Other Function Configuration

                                                      @@ -101,8 +102,8 @@

                                                      Yes

                                                      This parameter is available only when Login Mode is set to Key Pair.

                                                      -

                                                      If Key Pair is the login mode of the host, you need to obtain the private key file, upload it to OBS, and select an OBS path.

                                                      -
                                                      NOTE:

                                                      The uploaded private key must match the public key configured on the host. For details, see "Passwords and Key Pairs" > "Key Pairs" > "Application Scenarios for Using Key Pairs" in Elastic Cloud Server User Guide.

                                                      +

                                                      If Key Pair is the login mode of the host, you need to obtain the private key file, upload it to OBS, and select an OBS path.

                                                      +
                                                      NOTE:

                                                      The uploaded private key must match the public key configured on the host. For details, see "Passwords and Key Pairs" > "Key Pairs" > "Application Scenarios for Using Key Pairs" in Elastic Cloud Server User Guide.

                                                      @@ -37,8 +37,7 @@ - @@ -83,10 +82,12 @@ @@ -95,17 +96,20 @@ - @@ -162,21 +166,65 @@

                                                      Enter the password configured when LDAP authentication was enabled for MRS Hive.

                                                      + + + + + + + + + + + + + + + + + + +
                                                      Table 1 MRS Hive connection

                                                      Parameter

                                                      Yes

                                                      Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      +

                                                      Select the modules for which this connection is available.

                                                      Basic and Network Connectivity Configuration

                                                      @@ -73,7 +72,7 @@
                                                      Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                      NOTE:

                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                      -

                                                      You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                      +

                                                      You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                      Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                      • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                      • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                      Yes

                                                      This parameter is mandatory when MRS API connection is selected for Connection Type or Cluster Name Mode is selected for Manual.

                                                      -

                                                      The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                      -
                                                      NOTE:

                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                      +
                                                      The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                      NOTE:

                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                      +
                                                      +
                                                      +
                                                      If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                      • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                      +
                                                      NOTE:

                                                      If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                      -
                                                      If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                      • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                      • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                      No

                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                      -

                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                      +
                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                      NOTE:
                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                      +
                                                      +

                                                      Agent

                                                      Yes

                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                      -

                                                      MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                      -

                                                      As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                      -
                                                      NOTE:
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                      +

                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                      +

                                                      MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                      +

                                                      As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                      +
                                                      NOTE:
                                                      • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                        +

                                                      OBS storage support

                                                      +

                                                      No

                                                      +

                                                      This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                                      +

                                                      The server must support OBS storage. When creating a Hive table, you can store the table in OBS.

                                                      +

                                                      Use Agency

                                                      +

                                                      No

                                                      +

                                                      This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                                      +

                                                      If you enable the agency function, you can create a data connection without having a permanent AK/SK and execute CDM jobs using the scheduling identity configured in DataArts Factory.

                                                      +

                                                      Public agency

                                                      +

                                                      No

                                                      +

                                                      This parameter is displayed when DataArts Migration is selected for Applicable Modules and Use Agency is enabled.

                                                      +

                                                      The agency is only used to check whether the connection agency function is normal. CDM jobs will be executed using the scheduling identity configured in DataArts Factory.

                                                      +

                                                      AK

                                                      +

                                                      N/A

                                                      +

                                                      This parameter is displayed when DataArts Migration is selected for Applicable Modules and OBS storage support is enabled.

                                                      +

                                                      AK and SK are used to log in to the OBS server.

                                                      +

                                                      You need to create an access key for the current account and obtain an AK/SK pair.

                                                      +
                                                      To obtain an access key, perform the following steps:
                                                      1. Log in to the management console, move the cursor to the username in the upper right corner, and select My Credentials from the drop-down list.
                                                      2. On the My Credentials page, choose Access Keys, and click Create Access Key. See Figure 1.
                                                        Figure 1 Clicking Create Access Key
                                                        +
                                                      3. Click OK and save the access key file as prompted. The access key file will be saved to your browser's configured download location. Open the credentials.csv file to view Access Key Id and Secret Access Key.
                                                        NOTE:
                                                        • Only two access keys can be added for each user.
                                                        • To ensure access key security, the access key is automatically downloaded only when it is generated for the first time and cannot be obtained from the management console later. Keep them properly.
                                                        +
                                                        +
                                                      +
                                                      +

                                                      +

                                                      SK

                                                      +

                                                      N/A

                                                      +

                                                      Creating a Kerberos Authentication User for an MRS Security Cluster

                                                      To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                      For clusters of MRS 3.x:

                                                      1. Log in to MRS Manager as user admin.
                                                      2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                        • Set Password Policy Name to neverexp.
                                                        • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                        • Set Password Expiration Notification (Days) to 0.
                                                        • Retain the default values for other parameters.
                                                        -
                                                      3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        +
                                                      4. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                      5. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                      6. Synchronize IAM users.
                                                        1. Log in to the MRS console.
                                                        2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                        3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                          • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                          • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                      For clusters of MRS 2.x or earlier:

                                                      -
                                                      1. Log in to MRS Manager as user admin.
                                                      2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                        • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                        • Set Password Expiration Notification (Days) to 0.
                                                        • Retain the default values for other parameters.
                                                        -
                                                      3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                        • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        +
                                                        1. Log in to the MRS Manager as user admin.
                                                        2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                          • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                          • Set Password Expiration Notification (Days) to 0.
                                                          • Retain the default values for other parameters.
                                                          +
                                                        3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                          • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                        5. Synchronize IAM users.
                                                          1. Log in to the MRS console.
                                                          2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                          3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                            • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                            • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                            @@ -186,7 +234,14 @@
                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1307.html b/docs/dataartsstudio/umn/dataartsstudio_01_1307.html index b2aa6343a..4ac546847 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1307.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1307.html @@ -1,6 +1,6 @@ -

                                                        Configuring an MRS HBase Connection

                                                        +

                                                        MRS HBase Connection Parameters

                                                        @@ -37,8 +37,7 @@ - - @@ -56,12 +55,12 @@ - @@ -70,10 +69,12 @@ @@ -81,16 +82,19 @@ - - @@ -101,8 +105,8 @@ - @@ -110,8 +114,8 @@ - @@ -126,20 +130,20 @@
                                                        Table 1 MRS HBase connection

                                                        Parameter

                                                        Yes

                                                        Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                        -

                                                        All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                        +

                                                        Select the modules for which this connection is available.

                                                        Basic and Network Connectivity Configuration

                                                        @@ -48,7 +47,7 @@

                                                        Yes

                                                        Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                        • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                        • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                                        +
                                                        Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                        • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                        • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                                        Yes

                                                        This parameter is mandatory when Connection String Mode is selected for Manual.

                                                        -
                                                        Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                        NOTE:

                                                        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                        +

                                                        This parameter is mandatory when Connection String Mode is selected for Manual.

                                                        +
                                                        Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                        NOTE:

                                                        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                        -

                                                        You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                        -
                                                        Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                        • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                        • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                                        +

                                                        You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                        +
                                                        Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                        • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                        • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                        Yes

                                                        This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                        -

                                                        MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                        -
                                                        NOTE:

                                                        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                        +
                                                        The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                        NOTE:

                                                        DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                        +
                                                        +
                                                        +
                                                        If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                        • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                        • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                        • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                        +
                                                        NOTE:

                                                        If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                        -
                                                        If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                        • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                        • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                        • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                        Yes

                                                        KMS key used to encrypt and decrypt the authentication information for the data source

                                                        +
                                                        KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                        NOTE:
                                                        • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                        • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                        +
                                                        +

                                                        Agent

                                                        Yes

                                                        MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                        -

                                                        As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                        -
                                                        NOTE:
                                                        • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                        • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                        +

                                                        MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                        +

                                                        As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                        +
                                                        NOTE:
                                                        • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                        • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                          +

                                                        Yes

                                                        This parameter is mandatory when Connection String Mode is selected for Manual.

                                                        -
                                                        Authentication method used for accessing MRS
                                                        • SIMPLE: Select this for non-security mode.
                                                        • KERBEROS: Select this for security mode.
                                                        +

                                                        This parameter is mandatory when Connection String Mode is selected for Manual.

                                                        +
                                                        It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                                        • SIMPLE: for non-security mode
                                                        • KERBEROS: for security mode

                                                        Yes

                                                        Username of the MRS cluster. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                        -
                                                        To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                        NOTE:
                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                        +

                                                        Username of the MRS cluster If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                        +
                                                        To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                        NOTE:
                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                        -

                                                        Creating a Kerberos Authentication User for an MRS Security Cluster

                                                        To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                        +

                                                        Creating a Kerberos Authentication User for an MRS Security Cluster

                                                        To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                        For clusters of MRS 3.x:

                                                        -
                                                        1. Log in to MRS Manager as user admin.
                                                        2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                          • Set Password Policy Name to neverexp.
                                                          • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                          • Set Password Expiration Notification (Days) to 0.
                                                          • Retain the default values for other parameters.
                                                          -
                                                        3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                          • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                          • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                          +
                                                          1. Log in to MRS Manager as user admin.
                                                          2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                            • Set Password Policy Name to neverexp.
                                                            • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                            • Set Password Expiration Notification (Days) to 0.
                                                            • Retain the default values for other parameters.
                                                            +
                                                          3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                            • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                            • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                            • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                            -
                                                          4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                          5. Synchronize IAM users.
                                                            1. Log in to the MRS console.
                                                            2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                            3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                              • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                              • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                              +
                                                            4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                            5. Synchronize IAM users.
                                                              1. Log in to the MRS console.
                                                              2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                              3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                            For clusters of MRS 2.x or earlier:

                                                            -
                                                            1. Log in to MRS Manager as user admin.
                                                            2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                              • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                              • Set Password Expiration Notification (Days) to 0.
                                                              • Retain the default values for other parameters.
                                                              -
                                                            3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                              • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                              • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                              +
                                                              1. Log in to the MRS Manager as user admin.
                                                              2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                • Set Password Expiration Notification (Days) to 0.
                                                                • Retain the default values for other parameters.
                                                                +
                                                              3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                -
                                                              4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                              5. Synchronize IAM users.
                                                                1. Log in to the MRS console.
                                                                2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                  • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                  • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                  +
                                                                4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                5. Synchronize IAM users.
                                                                  1. Log in to the MRS console.
                                                                  2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                  3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                    • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                    • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                @@ -147,7 +151,7 @@
                                                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1308.html b/docs/dataartsstudio/umn/dataartsstudio_01_1308.html index 992f9fb0b..c882f8546 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1308.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1308.html @@ -1,6 +1,6 @@ -

                                                              Configuring an MRS Kafka Connection

                                                              +

                                                              MRS Kafka Connection Parameters

                                                              @@ -37,8 +37,7 @@ - - @@ -56,12 +55,12 @@ - @@ -69,11 +68,13 @@ - @@ -81,16 +82,19 @@ - - @@ -101,8 +105,8 @@ - @@ -110,8 +114,8 @@ - @@ -126,20 +130,20 @@
                                                              Table 1 MRS Kafka connection

                                                              Parameter

                                                              Yes

                                                              Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                              -

                                                              All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                              +

                                                              Select the modules for which this connection is available.

                                                              Basic and Network Connectivity Configuration

                                                              @@ -48,7 +47,7 @@

                                                              Yes

                                                              Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                              • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                              • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                                              +
                                                              Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                              • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                              • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                                              Yes

                                                              This parameter is mandatory when Connection String Mode is selected for Manual.

                                                              -
                                                              Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                              NOTE:

                                                              DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                              +

                                                              This parameter is mandatory when Connection String Mode is selected for Manual.

                                                              +
                                                              Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                              NOTE:

                                                              DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                              -

                                                              You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                              -
                                                              Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                              • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                              • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                                              +

                                                              You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                              +
                                                              Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                              • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                              • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                              Yes

                                                              This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                              -

                                                              MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                              -
                                                              NOTE:

                                                              DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                              +

                                                              This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                              +
                                                              The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                              NOTE:

                                                              DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                              +
                                                              +
                                                              +
                                                              If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                              • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                              • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                              • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                              +
                                                              NOTE:

                                                              If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                              -
                                                              If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                              • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                              • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                              • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                              Yes

                                                              KMS key used to encrypt and decrypt the authentication information for the data source

                                                              +
                                                              KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                              NOTE:
                                                              • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                              • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                              +
                                                              +

                                                              Agent

                                                              Yes

                                                              MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                              -

                                                              As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                              -
                                                              NOTE:
                                                              • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                              • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                              +

                                                              MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                              +

                                                              As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                              +
                                                              NOTE:
                                                              • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                              • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                +

                                                              Yes

                                                              This parameter is mandatory when Connection String Mode is selected for Manual.

                                                              -
                                                              Authentication method used for accessing MRS
                                                              • SIMPLE: Select this for non-security mode.
                                                              • KERBEROS: Select this for security mode.
                                                              +

                                                              This parameter is mandatory when Connection String Mode is selected for Manual.

                                                              +
                                                              It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                                              • SIMPLE: for non-security mode
                                                              • KERBEROS: for security mode

                                                              Yes

                                                              Username of the MRS cluster. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                              -
                                                              To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                              NOTE:
                                                              • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                              • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                              • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                              • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                              +

                                                              Username of the MRS cluster If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                              +
                                                              To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                              NOTE:
                                                              • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                              • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                              • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                              • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                              -

                                                              Creating a Kerberos Authentication User for an MRS Security Cluster

                                                              To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                              +

                                                              Creating a Kerberos Authentication User for an MRS Security Cluster

                                                              To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                              For clusters of MRS 3.x:

                                                              -
                                                              1. Log in to MRS Manager as user admin.
                                                              2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                • Set Password Policy Name to neverexp.
                                                                • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                • Set Password Expiration Notification (Days) to 0.
                                                                • Retain the default values for other parameters.
                                                                -
                                                              3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                +
                                                                1. Log in to MRS Manager as user admin.
                                                                2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                  • Set Password Policy Name to neverexp.
                                                                  • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                  • Set Password Expiration Notification (Days) to 0.
                                                                  • Retain the default values for other parameters.
                                                                  +
                                                                3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                  • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                  • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                  • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                  -
                                                                4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                5. Synchronize IAM users.
                                                                  1. Log in to the MRS console.
                                                                  2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                  3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                    • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                    • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                    +
                                                                  4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                  5. Synchronize IAM users.
                                                                    1. Log in to the MRS console.
                                                                    2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                    3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                      • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                      • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                                  For clusters of MRS 2.x or earlier:

                                                                  -
                                                                  1. Log in to MRS Manager as user admin.
                                                                  2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                    • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                    • Set Password Expiration Notification (Days) to 0.
                                                                    • Retain the default values for other parameters.
                                                                    -
                                                                  3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                    • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                    • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                    +
                                                                    1. Log in to the MRS Manager as user admin.
                                                                    2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                      • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                      • Set Password Expiration Notification (Days) to 0.
                                                                      • Retain the default values for other parameters.
                                                                      +
                                                                    3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                      • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                      • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                      -
                                                                    4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                    5. Synchronize IAM users.
                                                                      1. Log in to the MRS console.
                                                                      2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                      3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                        • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                        • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                        +
                                                                      4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                      5. Synchronize IAM users.
                                                                        1. Log in to the MRS console.
                                                                        2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                        3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                          • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                          • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                      @@ -147,7 +151,7 @@
                                                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1309.html b/docs/dataartsstudio/umn/dataartsstudio_01_1309.html index fa95d00e5..221c1a57f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1309.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1309.html @@ -1,6 +1,6 @@ -

                                                                    Configuring an MRS ClickHouse Connection

                                                                    +

                                                                    MRS ClickHouse Connection Parameters

                                                                    @@ -37,8 +37,7 @@ - - @@ -56,12 +55,12 @@ - @@ -69,11 +68,13 @@ - @@ -81,17 +82,20 @@ - - @@ -102,8 +106,8 @@ - @@ -111,8 +115,8 @@ - @@ -127,20 +131,20 @@
                                                                    Table 1 MRS ClickHouse connection

                                                                    Parameter

                                                                    Yes

                                                                    Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                                    -

                                                                    All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                                    +

                                                                    Select the modules for which this connection is available.

                                                                    Basic and Network Connectivity Configuration

                                                                    @@ -48,7 +47,7 @@

                                                                    Yes

                                                                    Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                    • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                    • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                                                    +
                                                                    Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                    • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                    • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                                                    Yes

                                                                    This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                    -
                                                                    Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                    NOTE:

                                                                    DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                    +

                                                                    This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                    +
                                                                    Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                    NOTE:

                                                                    DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                    -

                                                                    You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                    -
                                                                    Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                    • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                    • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                                                    +

                                                                    You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                    +
                                                                    Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                    • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                    • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                                    Yes

                                                                    This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                                    -

                                                                    MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                                    -
                                                                    NOTE:

                                                                    DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                    +

                                                                    This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                                    +
                                                                    The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                                    NOTE:

                                                                    DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                    +
                                                                    +
                                                                    +
                                                                    If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                    • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                    • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                                    • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                                    +
                                                                    NOTE:

                                                                    If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                                    -
                                                                    If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                    • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                    • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                                    • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                                    Yes

                                                                    KMS key used to encrypt and decrypt the authentication information for the data source

                                                                    +
                                                                    KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                    NOTE:
                                                                    • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                    • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                    +
                                                                    +

                                                                    Agent

                                                                    Yes

                                                                    MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                                    -

                                                                    As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                                    -
                                                                    NOTE:
                                                                    • MRS ClickHouse connections are supported only in CDM 2.9.2 and later versions.
                                                                    • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                                    -
                                                                    • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                                    +

                                                                    MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                                    +

                                                                    As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                                    +
                                                                    NOTE:
                                                                    • MRS ClickHouse connections are supported only in CDM 2.9.2 and later versions.
                                                                    • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                                    +
                                                                    • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                      +

                                                                    Yes

                                                                    This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                    -
                                                                    Authentication method used for accessing MRS
                                                                    • SIMPLE: Select this for non-security mode.
                                                                    • KERBEROS: Select this for security mode.
                                                                    +

                                                                    This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                    +
                                                                    It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                                                    • SIMPLE: for non-security mode
                                                                    • KERBEROS: for security mode

                                                                    Yes

                                                                    Username of the MRS cluster. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                                    -
                                                                    To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                    NOTE:
                                                                    • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                    • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                    • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                    • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                                    +

                                                                    Username of the MRS cluster If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                                    +
                                                                    To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                    NOTE:
                                                                    • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                    • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                    • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                    • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                                    -

                                                                    Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                    To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                    +

                                                                    Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                    To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                    For clusters of MRS 3.x:

                                                                    -
                                                                    1. Log in to MRS Manager as user admin.
                                                                    2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                      • Set Password Policy Name to neverexp.
                                                                      • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                      • Set Password Expiration Notification (Days) to 0.
                                                                      • Retain the default values for other parameters.
                                                                      -
                                                                    3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                      • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                      • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                      • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                      +
                                                                      1. Log in to MRS Manager as user admin.
                                                                      2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                        • Set Password Policy Name to neverexp.
                                                                        • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                        • Set Password Expiration Notification (Days) to 0.
                                                                        • Retain the default values for other parameters.
                                                                        +
                                                                      3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                        -
                                                                      4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                      5. Synchronize IAM users.
                                                                        1. Log in to the MRS console.
                                                                        2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                        3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                          • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                          • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                          +
                                                                        4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                        5. Synchronize IAM users.
                                                                          1. Log in to the MRS console.
                                                                          2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                          3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                            • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                            • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                                        For clusters of MRS 2.x or earlier:

                                                                        -
                                                                        1. Log in to MRS Manager as user admin.
                                                                        2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                          • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                          • Set Password Expiration Notification (Days) to 0.
                                                                          • Retain the default values for other parameters.
                                                                          -
                                                                        3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                          • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                          +
                                                                          1. Log in to the MRS Manager as user admin.
                                                                          2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                            • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                            • Set Password Expiration Notification (Days) to 0.
                                                                            • Retain the default values for other parameters.
                                                                            +
                                                                          3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                            • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                            • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                            -
                                                                          4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                          5. Synchronize IAM users.
                                                                            1. Log in to the MRS console.
                                                                            2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                            3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                              • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                              • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                              +
                                                                            4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                            5. Synchronize IAM users.
                                                                              1. Log in to the MRS console.
                                                                              2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                              3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                            @@ -148,7 +152,7 @@
                                                                          diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1310.html b/docs/dataartsstudio/umn/dataartsstudio_01_1310.html index f27d04498..51ddc6526 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1310.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1310.html @@ -1,6 +1,6 @@ -

                                                                          Configuring an MRS Hetu Connection

                                                                          +

                                                                          MRS Hetu Connection Parameters

                                                                          @@ -37,8 +37,7 @@ - - @@ -56,14 +55,14 @@ - @@ -71,13 +70,15 @@ - @@ -85,16 +86,19 @@ - - @@ -123,8 +127,8 @@ - @@ -133,10 +137,10 @@ @@ -150,20 +154,20 @@
                                                                          Table 1 MRS Hetu connection

                                                                          Parameter

                                                                          Yes

                                                                          Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                                          -

                                                                          All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                                          +

                                                                          Select the modules for which this connection is available.

                                                                          Basic and Network Connectivity Configuration

                                                                          @@ -48,7 +47,7 @@

                                                                          Yes

                                                                          Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                          • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                          • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                                                          +
                                                                          Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                          • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                          • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                                                          Yes

                                                                          This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                          -
                                                                          Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                          NOTE:

                                                                          DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                          +

                                                                          This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                          +
                                                                          Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                          NOTE:

                                                                          DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                          NOTE:
                                                                          • MRS clusters of version 3.1.1 and later can be connected.
                                                                          • To connect to MRS clusters of version 3.2.1, add parameter protocol.v1.alternate-header-name with value Presto in the coordinator.config.properties and worker.config.properties files for the compute instance on the HetuEngine WebUI.
                                                                          -

                                                                          You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                          -
                                                                          Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                          • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                          • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                                                          +

                                                                          You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                          +
                                                                          Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                          • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                          • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                                          Yes

                                                                          This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                                          -

                                                                          MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                                          -
                                                                          NOTE:

                                                                          DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                          +

                                                                          This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                                          +
                                                                          The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                                          NOTE:

                                                                          DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                          -
                                                                          NOTE:
                                                                          • MRS clusters of version 3.1.1 and later can be connected.
                                                                          • To connect to MRS clusters of version 3.2.1, add parameter protocol.v1.alternate-header-name with value Presto in the coordinator.config.properties and worker.config.properties files for the compute instance on the HetuEngine WebUI.
                                                                          +
                                                                          +
                                                                          NOTE:
                                                                          • MRS clusters of version 3.1.1 and later can be connected.
                                                                          • To connect to MRS clusters of version 3.2.1, add parameter protocol.v1.alternate-header-name with value Presto in the coordinator.config.properties and worker.config.properties files for the compute instance on the HetuEngine WebUI.
                                                                          +
                                                                          +
                                                                          If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                          • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                          • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                                          • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                                          +
                                                                          NOTE:

                                                                          If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                                          -
                                                                          If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                          • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                          • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                                          • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                                          Yes

                                                                          KMS key used to encrypt and decrypt the authentication information for the data source

                                                                          +
                                                                          KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                          NOTE:
                                                                          • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                          • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                          +
                                                                          +

                                                                          Agent

                                                                          Yes

                                                                          MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                                          -

                                                                          As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                                          -
                                                                          NOTE:
                                                                          • MRS Hetu connections are supported only in CDM 2.9.2 and later versions.
                                                                          • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                                          • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                                          +

                                                                          MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                                          +

                                                                          As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                                          +
                                                                          NOTE:
                                                                          • MRS Hetu connections are supported only in CDM 2.9.2 and later versions.
                                                                          • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                                          • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                            +

                                                                          Yes

                                                                          This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                          -
                                                                          Authentication method used for accessing MRS
                                                                          • SIMPLE: Select this for non-security mode.
                                                                          • KERBEROS: Select this for security mode.
                                                                          +

                                                                          This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                          +
                                                                          It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                                                          • SIMPLE: for non-security mode
                                                                          • KERBEROS: for security mode

                                                                          Yes

                                                                          Username of the MRS cluster. The user must have permissions of HetuEngine.

                                                                          -
                                                                          To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                          NOTE:
                                                                          • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                          • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                          • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                                          +
                                                                          To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                          NOTE:
                                                                          • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                          • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                          • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                                          -
                                                                          NOTICE:

                                                                          After creating the HetuEngine user, you need to complete the configurations in "Using HetuEngine from Scratch" in MapReduce Service (MRS) x.x.x Usage Guide.

                                                                          +
                                                                          NOTICE:

                                                                          After creating the HetuEngine user, you need to complete the configurations in "Using HetuEngine from Scratch" in MapReduce Service (MRS) x.x.x Usage Guide.

                                                                          -

                                                                          Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                          To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                          +

                                                                          Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                          To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                          For clusters of MRS 3.x:

                                                                          -
                                                                          1. Log in to MRS Manager as user admin.
                                                                          2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                            • Set Password Policy Name to neverexp.
                                                                            • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                            • Set Password Expiration Notification (Days) to 0.
                                                                            • Retain the default values for other parameters.
                                                                            -
                                                                          3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                            • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                            • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                            • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                            +
                                                                            1. Log in to MRS Manager as user admin.
                                                                            2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                              • Set Password Policy Name to neverexp.
                                                                              • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                              • Set Password Expiration Notification (Days) to 0.
                                                                              • Retain the default values for other parameters.
                                                                              +
                                                                            3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                              • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                              • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                              • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                              -
                                                                            4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                            5. Synchronize IAM users.
                                                                              1. Log in to the MRS console.
                                                                              2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                              3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                +
                                                                              4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                              5. Synchronize IAM users.
                                                                                1. Log in to the MRS console.
                                                                                2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                  • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                  • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                                              For clusters of MRS 2.x or earlier:

                                                                              -
                                                                              1. Log in to MRS Manager as user admin.
                                                                              2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                                • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                • Set Password Expiration Notification (Days) to 0.
                                                                                • Retain the default values for other parameters.
                                                                                -
                                                                              3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                +
                                                                                1. Log in to the MRS Manager as user admin.
                                                                                2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                                  • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                  • Set Password Expiration Notification (Days) to 0.
                                                                                  • Retain the default values for other parameters.
                                                                                  +
                                                                                3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                  • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                  • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                  -
                                                                                4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                5. Synchronize IAM users.
                                                                                  1. Log in to the MRS console.
                                                                                  2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                  3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                    • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                    • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                    +
                                                                                  4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                  5. Synchronize IAM users.
                                                                                    1. Log in to the MRS console.
                                                                                    2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                    3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                      • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                      • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                  @@ -171,7 +175,7 @@
                                                                                diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1311.html b/docs/dataartsstudio/umn/dataartsstudio_01_1311.html index 5ee58aa26..44d6d4ee9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1311.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1311.html @@ -1,6 +1,6 @@ -

                                                                                Configuring an MRS Impala Connection

                                                                                +

                                                                                MRS Impala Connection Parameters

                                                                                @@ -37,8 +37,7 @@ - - @@ -56,12 +55,12 @@ - @@ -69,11 +68,13 @@ - @@ -81,16 +82,19 @@ - - @@ -110,8 +114,8 @@ - @@ -119,8 +123,8 @@ - @@ -129,7 +133,7 @@ -
                                                                                Table 1 MRS Impala connection

                                                                                Parameter

                                                                                Yes

                                                                                Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                                                -

                                                                                All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                                                +

                                                                                Select the modules for which this connection is available.

                                                                                Basic and Network Connectivity Configuration

                                                                                @@ -48,7 +47,7 @@

                                                                                Yes

                                                                                Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                                • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                                • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                                                                +
                                                                                Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                                • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                                • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                                                                Yes

                                                                                This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                -
                                                                                Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                                NOTE:

                                                                                DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                +

                                                                                This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                +
                                                                                Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                                NOTE:

                                                                                DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                -

                                                                                You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                                -
                                                                                Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                                • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                                • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                                                                +

                                                                                You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                                +
                                                                                Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                                • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                                • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                                                Yes

                                                                                This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                                                -

                                                                                MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                                                -
                                                                                NOTE:

                                                                                DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                +

                                                                                This parameter is mandatory when Cluster Name Mode is selected for Manual.

                                                                                +
                                                                                The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                                                NOTE:

                                                                                DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                +
                                                                                +
                                                                                +
                                                                                If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                                • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                                                • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                                                +
                                                                                NOTE:

                                                                                If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                                                -
                                                                                If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                                • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                                • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                                                • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                                                Yes

                                                                                KMS key used to encrypt and decrypt the authentication information for the data source

                                                                                +
                                                                                KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                                NOTE:
                                                                                • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                                • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                                +
                                                                                +

                                                                                Agent

                                                                                Yes

                                                                                MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                                                -

                                                                                As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                                                -
                                                                                NOTE:
                                                                                • MRS Impala connections are supported only in CDM 2.9.2 and later versions.
                                                                                • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                                                • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                                                +

                                                                                MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                                                +

                                                                                As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                                                +
                                                                                NOTE:
                                                                                • MRS Impala connections are supported only in CDM 2.9.2 and later versions.
                                                                                • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                                                • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                                  +

                                                                                Yes

                                                                                This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                -
                                                                                Authentication method used for accessing MRS
                                                                                • SIMPLE: Select this for non-security mode.
                                                                                • KERBEROS: Select this for security mode.
                                                                                +

                                                                                This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                +
                                                                                It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                                                                • SIMPLE: for non-security mode
                                                                                • KERBEROS: for security mode

                                                                                Yes

                                                                                Human-machine user of the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                                                -
                                                                                To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                                NOTE:
                                                                                • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                                                +

                                                                                Human-machine user of the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                                                +
                                                                                To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                                NOTE:
                                                                                • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.

                                                                                Yes

                                                                                The password for accessing the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                +

                                                                                The password for accessing the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                Enable ldap

                                                                                @@ -159,20 +163,20 @@
                                                                                -

                                                                                Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                                To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                                +

                                                                                Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                                To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                                For clusters of MRS 3.x:

                                                                                -
                                                                                1. Log in to MRS Manager as user admin.
                                                                                2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                                  • Set Password Policy Name to neverexp.
                                                                                  • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                  • Set Password Expiration Notification (Days) to 0.
                                                                                  • Retain the default values for other parameters.
                                                                                  -
                                                                                3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                  • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                  • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                  • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                  +
                                                                                  1. Log in to MRS Manager as user admin.
                                                                                  2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                                    • Set Password Policy Name to neverexp.
                                                                                    • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                    • Set Password Expiration Notification (Days) to 0.
                                                                                    • Retain the default values for other parameters.
                                                                                    +
                                                                                  3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                    • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                    • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                    • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                    -
                                                                                  4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                  5. Synchronize IAM users.
                                                                                    1. Log in to the MRS console.
                                                                                    2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                    3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                      • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                      • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                      +
                                                                                    4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                    5. Synchronize IAM users.
                                                                                      1. Log in to the MRS console.
                                                                                      2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                      3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                        • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                        • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                                                    For clusters of MRS 2.x or earlier:

                                                                                    -
                                                                                    1. Log in to MRS Manager as user admin.
                                                                                    2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                                      • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                      • Set Password Expiration Notification (Days) to 0.
                                                                                      • Retain the default values for other parameters.
                                                                                      -
                                                                                    3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                      • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                      • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                      +
                                                                                      1. Log in to the MRS Manager as user admin.
                                                                                      2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                                        • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                        • Set Password Expiration Notification (Days) to 0.
                                                                                        • Retain the default values for other parameters.
                                                                                        +
                                                                                      3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                        • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                        -
                                                                                      4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                      5. Synchronize IAM users.
                                                                                        1. Log in to the MRS console.
                                                                                        2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                        3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                          • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                          • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                          +
                                                                                        4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                        5. Synchronize IAM users.
                                                                                          1. Log in to the MRS console.
                                                                                          2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                          3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                            • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                            • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                        @@ -180,7 +184,7 @@
                                                                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1314.html b/docs/dataartsstudio/umn/dataartsstudio_01_1314.html index 2628cf477..f1fa62472 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1314.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1314.html @@ -1,6 +1,6 @@ -

                                                                                      Configuring an MRS Spark Connection

                                                                                      +

                                                                                      MRS Spark Connection Parameters

                                                                                      @@ -37,8 +37,7 @@ - - - @@ -70,12 +69,12 @@ - @@ -83,11 +82,13 @@ - @@ -95,18 +96,21 @@ - - @@ -117,8 +121,8 @@ - @@ -126,7 +130,7 @@ - @@ -134,7 +138,7 @@ - @@ -142,8 +146,8 @@ - @@ -152,26 +156,26 @@ -
                                                                                      Table 1 MRS Spark connection

                                                                                      Parameter

                                                                                      Yes

                                                                                      Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                                                      -

                                                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                                                      +

                                                                                      Select the modules for which this connection is available.

                                                                                      Basic and Network Connectivity Configuration

                                                                                      @@ -48,7 +47,7 @@

                                                                                      Yes

                                                                                      Connection type. Proxy connection is recommended.
                                                                                      • Proxy connection: An agent (CDM cluster) is used to access MRS clusters. This method supports all versions of MRS clusters.
                                                                                      • MRS API connection: MRS APIs are used to access MRS clusters. This method supports only MRS clusters of the 2.X or a later version.

                                                                                        When you select MRS API connection, pay attention to the following restrictions:

                                                                                        +
                                                                                      Connection type. Proxy connection is recommended.
                                                                                      • Proxy connection: An agent (CDM cluster) is used to access MRS clusters. This method supports all versions of MRS clusters.
                                                                                      • MRS API connection: MRS APIs are used to access MRS clusters. This method supports only MRS clusters of the 2.X or a later version.

                                                                                        When you select MRS API connection, pay attention to the following restrictions:

                                                                                        1. In DataArts Factory, you cannot view or manage the databases, data tables, and fields of the connection in a visualized manner. If an MRS cluster of version 3.2.1 or later is connected, you can view rather than manage the databases, data tables, and fields of the connection in a visualized manner.
                                                                                        2. When the SQL editor of DataArts Factory is used to run SQL statements, the execution results can be displayed only in logs.
                                                                                      @@ -61,8 +60,8 @@

                                                                                      Yes

                                                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      -
                                                                                      Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                                      • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                                      • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.
                                                                                      +

                                                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      +
                                                                                      Select the connection mode. If you do not need to access MRS clusters in other projects or enterprise projects, select Cluster Name Mode.
                                                                                      • Cluster Name Mode: Select an existing cluster. You can only connect to an MRS cluster in the same project and enterprise project.
                                                                                      • If you select Connection String Mode, you can set Manager IP and enable communication between this connection's agent (CDM cluster) and an MRS cluster in another project or enterprise project so that you can access the MRS cluster.

                                                                                      Yes

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      -
                                                                                      Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                                      NOTE:

                                                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                      +

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      +
                                                                                      Set this parameter to the floating IP address of MRS Manager. Only MRS clusters are supported. A Hadoop cluster can be connected only after it is managed by MRS.
                                                                                      NOTE:

                                                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                      -

                                                                                      You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to the Management Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                                      -
                                                                                      Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                                      • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                                      • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.
                                                                                      +

                                                                                      You can click Select next to the text box and select an MRS cluster in the same project and enterprise project. If you want to access an MRS cluster in another project or enterprise project, obtain and enter the floating IP address of MRS Manager and ensure that the connection's agent (CDM cluster) can communicate with the tenant-plane MRS cluster. To obtain the floating IP address of MRS Manager, log in to the active master node of the MRS cluster and run the ifconfig command. In the command output, the IP address of eth0:wsom is the floating IP address of MRS Manager. For details about how to log in to the master node of the MRS cluster, see "Manager Operation Guide" > "Getting Started" > "Logging In to an MRS Cluster Node" in MapReduce Service (MRS) x.x.x User Guide.

                                                                                      +
                                                                                      Enter multiple IP addresses based on the scenario in sequence and separate them with commas (,), for example, 127.0.0.1 or 127.0.0.1,127.0.0.2,127.0.0.3.
                                                                                      • If you enter one IP address, enter the management-plane floating IP address of the MRS cluster.
                                                                                      • If you enter three IP addresses, enter the IP address of the active node on the MRS cluster service plane, IP address of the standby node on the MRS cluster service plane, and the floating IP address of the MRS cluster management plane.

                                                                                      Yes

                                                                                      This parameter is mandatory when MRS API connection is selected for Connection Type or Cluster Name Mode is selected for Manual.

                                                                                      -

                                                                                      MRS cluster that Flink Server belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                                                      -
                                                                                      NOTE:

                                                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                      +

                                                                                      This parameter is mandatory when MRS API connection is selected for Connection Type or Cluster Name Mode is selected for Manual.

                                                                                      +
                                                                                      The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                                                      NOTE:

                                                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                                                      +
                                                                                      +
                                                                                      +
                                                                                      If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                                                      • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                                                      +
                                                                                      NOTE:

                                                                                      If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                                                      -
                                                                                      If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                                                      • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and the MRS cluster are in different regions, you need to enable the communications between them through the Internet or a Direct Connect connection. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                                                      • If the DataArts Studio instance (CDM cluster in the DataArts Studio instance) and MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                                                      • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.

                                                                                      Yes

                                                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      -

                                                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                                                      +

                                                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      +
                                                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                                      NOTE:
                                                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                                      +
                                                                                      +

                                                                                      Agent

                                                                                      Yes

                                                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      -

                                                                                      MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                                                      -

                                                                                      As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                                                      -
                                                                                      NOTE:
                                                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                                                      +

                                                                                      This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      +

                                                                                      MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                                                      +

                                                                                      As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                                                      +
                                                                                      NOTE:
                                                                                      • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                                        +

                                                                                      Yes

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      -
                                                                                      Authentication method used for accessing MRS
                                                                                      • SIMPLE: Select this for non-security mode.
                                                                                      • KERBEROS: Select this for security mode.
                                                                                      +

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      +
                                                                                      It specifies the authentication method used for accessing the MRS cluster. The following options are available:
                                                                                      • SIMPLE: for non-security mode
                                                                                      • KERBEROS: for security mode

                                                                                      No

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      +

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      Select the MRS cluster version.

                                                                                      No

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      +

                                                                                      This parameter is mandatory when Connection String Mode is selected for Manual.

                                                                                      Select the Spark version.

                                                                                      Yes

                                                                                      Human-machine user of the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                                                      -
                                                                                      To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                                      NOTE:
                                                                                      • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                      • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                      • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                      • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.
                                                                                      +

                                                                                      Human-machine user of the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection. If a new MRS user is used for connection, you need to log in to Manager and change the initial password.

                                                                                      +
                                                                                      To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. You can create an MRS user whose password never expires by referring to Creating a Kerberos Authentication User for an MRS Security Cluster. When creating an MRS data connection, set Username and Password to the new MRS username and password.
                                                                                      NOTE:
                                                                                      • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                      • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                      • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                      • You are advised to set a user password that never expires to prevent connection failures and service loss caused by password expiration.

                                                                                      Yes

                                                                                      The password for accessing the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      +

                                                                                      The password for accessing the MRS cluster. This parameter is mandatory when Connection Type is set to Proxy connection.

                                                                                      -

                                                                                      Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                                      To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                                      +

                                                                                      Creating a Kerberos Authentication User for an MRS Security Cluster

                                                                                      To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                                                      For clusters of MRS 3.x:

                                                                                      -
                                                                                      1. Log in to MRS Manager as user admin.
                                                                                      2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                                        • Set Password Policy Name to neverexp.
                                                                                        • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                        • Set Password Expiration Notification (Days) to 0.
                                                                                        • Retain the default values for other parameters.
                                                                                        -
                                                                                      3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                        +
                                                                                        1. Log in to MRS Manager as user admin.
                                                                                        2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                                                          • Set Password Policy Name to neverexp.
                                                                                          • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                          • Set Password Expiration Notification (Days) to 0.
                                                                                          • Retain the default values for other parameters.
                                                                                          +
                                                                                        3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                          • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                                                          • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                          -
                                                                                        4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                        5. Synchronize IAM users.
                                                                                          1. Log in to the MRS console.
                                                                                          2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                          3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                            • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                            • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                            +
                                                                                          4. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                          5. Synchronize IAM users.
                                                                                            1. Log in to the MRS console.
                                                                                            2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                            3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                              • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                              • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.

                                                                                          For clusters of MRS 2.x or earlier:

                                                                                          -
                                                                                          1. Log in to MRS Manager as user admin.
                                                                                          2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                                            • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                            • Set Password Expiration Notification (Days) to 0.
                                                                                            • Retain the default values for other parameters.
                                                                                            -
                                                                                          3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                            • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                            • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                            +
                                                                                            1. Log in to the MRS Manager as user admin.
                                                                                            2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                                                              • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                                                              • Set Password Expiration Notification (Days) to 0.
                                                                                              • Retain the default values for other parameters.
                                                                                              +
                                                                                            3. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                                                              • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                                                              • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                                                              -
                                                                                            4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                            5. Synchronize IAM users.
                                                                                              1. Log in to the MRS console.
                                                                                              2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                              3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                                • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                                • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                                +
                                                                                              4. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                                                              5. Synchronize IAM users.
                                                                                                1. Log in to the MRS console.
                                                                                                2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                                                                3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                                                                  • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                                                                  • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                                                              @@ -179,7 +183,7 @@
                                                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1321.html b/docs/dataartsstudio/umn/dataartsstudio_01_1321.html new file mode 100644 index 000000000..64de53b92 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1321.html @@ -0,0 +1,87 @@ + + +

                                                                                            OpenSource ClickHouse Connection Parameters

                                                                                            +
                                                                                            +
                                                                                            + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                                            Table 1 OpenSource ClickHouse connection

                                                                                            Parameter

                                                                                            +

                                                                                            Mandatory

                                                                                            +

                                                                                            Description

                                                                                            +

                                                                                            Data Connection Type

                                                                                            +

                                                                                            Yes

                                                                                            +

                                                                                            OpenSource ClickHouse is selected by default and cannot be changed.

                                                                                            +

                                                                                            Name

                                                                                            +

                                                                                            Yes

                                                                                            +

                                                                                            Name of the data connection to create. Data connection names can contain a maximum of 100 characters. They can contain only letters, digits, underscores (_), and hyphens (-).

                                                                                            +

                                                                                            Tag

                                                                                            +

                                                                                            No

                                                                                            +
                                                                                            Attribute of the data connection to create. Tags make management easier.
                                                                                            NOTE:

                                                                                            The tag name can contain only letters, digits, and underscores (_) and cannot start with an underscore (_) or contain more than 100 characters.

                                                                                            +
                                                                                            +
                                                                                            +

                                                                                            Applicable Modules

                                                                                            +

                                                                                            Yes

                                                                                            +

                                                                                            Select the modules for which this connection is available.

                                                                                            +

                                                                                            Basic and Network Connectivity Configuration

                                                                                            +

                                                                                            IP Address

                                                                                            +

                                                                                            Yes

                                                                                            +

                                                                                            IP address of the node where the ClickHouseServer is located

                                                                                            +

                                                                                            Port

                                                                                            +

                                                                                            Yes

                                                                                            +

                                                                                            Used to receive JDBC requests. By default, the value of the http_port parameter of ClickHouseServer is used.

                                                                                            +

                                                                                            KMS Key

                                                                                            +

                                                                                            Yes

                                                                                            +
                                                                                            KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                                            NOTE:
                                                                                            • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                                            • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                                            +
                                                                                            +
                                                                                            +

                                                                                            Agent

                                                                                            +

                                                                                            Yes

                                                                                            +

                                                                                            As a network proxy, the CDM cluster must be able to communicate with the ClickHouseServer. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                                                            +
                                                                                            NOTE:

                                                                                            If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                                            +
                                                                                            +
                                                                                            +
                                                                                            +
                                                                                            + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1380.html b/docs/dataartsstudio/umn/dataartsstudio_01_1380.html index b1178de2f..0bed99211 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1380.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1380.html @@ -1,6 +1,6 @@ -

                                                                                            Link to Elasticsearch

                                                                                            +

                                                                                            Elasticsearch Link Parameters

                                                                                            Elasticsearch links can be used to connect to Elasticsearch services in third-party clouds and local data centers and on Elastic Cloud Servers (ECSs).

                                                                                            • The Elasticsearch connector only supports Elasticsearch clusters in non-security mode.
                                                                                            • Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.
                                                                                            @@ -18,7 +18,7 @@

                                                      Link name, which should be defined based on the data source type, so it is easier to remember what the link is for

                                                      css_link

                                                      +

                                                      es_link

                                                      Elasticsearch Server List

                                                      @@ -34,7 +34,7 @@
                                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1390.html b/docs/dataartsstudio/umn/dataartsstudio_01_1390.html index 123cb8c49..f4adc1e43 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1390.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1390.html @@ -1,6 +1,6 @@ -

                                                      Configuring an MRS Doris Connection

                                                      +

                                                      Doris Connection Parameters

                                                      @@ -14,7 +14,7 @@ - - - + + + + @@ -121,7 +131,8 @@ -
                                                      Table 1 MRS Doris connection

                                                      Parameter

                                                      Yes

                                                      MRS Doris is selected by default and cannot be changed.

                                                      +

                                                      Doris is selected by default and cannot be changed.

                                                      Name

                                                      @@ -38,7 +38,6 @@

                                                      Yes

                                                      Select the modules for which this connection is available.

                                                      -

                                                      All modules are selected by default, which means this connection is available for all the modules that support the data source connected by this connection. For details about the data sources supported by each module, see Data Sources.

                                                      Basic and Network Connectivity Configuration

                                                      @@ -56,13 +55,15 @@

                                                      Yes

                                                      This parameter is valid when Doris Type is set to MRS Doris.

                                                      -

                                                      The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.

                                                      -
                                                      NOTE:

                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                      +
                                                      NOTE:

                                                      This parameter is available only for MRS clusters of version 3.2.0 or later.

                                                      +
                                                      +
                                                      The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                      NOTE:

                                                      DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                      -
                                                      If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                      • If the CDM cluster in the DataArts Studio instance and the cloud service are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding a Custom Route" in Virtual Private Cloud (VPC) Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) Usage Guide.
                                                      • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                      -
                                                      NOTE:

                                                      Only non-security MRS clusters of version 3.2.0 and later support this connection.

                                                      +
                                                      If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                      • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                      • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                      +
                                                      NOTE:

                                                      If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                      +

                                                      FE IP

                                                      @@ -87,19 +88,28 @@

                                                      Yes

                                                      KMS key used to encrypt and decrypt the authentication information for the data source

                                                      +
                                                      KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                      NOTE:
                                                      • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                      • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                      +
                                                      +

                                                      Agent

                                                      Yes

                                                      MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first.

                                                      -

                                                      As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region, AZ, VPC, and subnet as the MRS cluster. The security group rule must also allow the CDM cluster communicate with the MRS cluster.

                                                      -
                                                      NOTE:
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster cannot connect to multiple MRS security clusters. You are advised to plan multiple agents which are mapped to MRS security clusters one by one.
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.
                                                      +

                                                      MRS is not a fully managed service and cannot be directly connected to DataArts Studio. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an MRS data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                      +

                                                      As a network proxy, the CDM cluster must be able to communicate with the MRS cluster. To ensure network connectivity, the CDM cluster must be in the same region and AZ and use the same VPC and subnet as the MRS cluster. The security group rule must also allow the CDM cluster to communicate with the MRS cluster.

                                                      +
                                                      NOTE:
                                                      • If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                      • If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                      SSL Encryption

                                                      +

                                                      No

                                                      +

                                                      Whether to enable SSL encrypted transmission. This function is enabled by default. Disable it if SSL is disabled at the source.

                                                      +

                                                      Data Source Driver Configuration

                                                      Yes

                                                      Path of the driver file in the OBS bucket. You need to download the .jar driver file from the corresponding official website and upload it to the OBS bucket.

                                                      +

                                                      This parameter is mandatory when Driver file source is set to OBS path.

                                                      +

                                                      Path of the driver file in the OBS bucket. You need to download the .jar driver file from the corresponding official website and upload it to the OBS bucket.

                                                      MySQL driver: Obtain the driver from https://downloads.mysql.com/archives/c-j/. Version 5.1.48 or later is recommended. If the version is earlier than 5.1.48, error "The db user or password invalid" will be reported.

                                                      NOTE:

                                                      To update the driver, you must restart the CDM cluster in DataArts Migration and then edit the data connection to upload the driver.

                                                      @@ -161,7 +172,7 @@

                                                      Creating a Kerberos Authentication User for an MRS Security Cluster

                                                      To create a data connection for an MRS security cluster, do not use user admin. The admin user is the default management page user and cannot be used as the authentication user of the security cluster. To create an MRS user, perform the following steps:

                                                      For clusters of MRS 3.x:

                                                      1. Log in to MRS Manager as user admin.
                                                      2. Choose System > Permission > Security Policy > Password Policy. Click Add Password Policy and add a policy under which the password never expires.
                                                        • Set Password Policy Name to neverexp.
                                                        • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                        • Set Password Expiration Notification (Days) to 0.
                                                        • Retain the default values for other parameters.
                                                        -
                                                      3. Choose System > Permission > User. On the page displayed, click Create to add a dedicated user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        +
                                                      4. Choose System > Permission > User. On the page displayed, click Create to add a dedicated human-machine user as the Kerberos authentication user and set the password policy to neverexp. Select the user group superGroup for the user, and assign all roles to the user.
                                                        • For clusters of MRS 3.1.0 or later, the user must at least have permissions of the Manager_viewer role to create data connections in Management Center. To perform database, table, and data operations on components, the user must also have user group permissions of the components.
                                                        • For clusters earlier than MRS 3.1.0, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                        • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                      5. Log in to Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                      6. Synchronize IAM users.
                                                        1. Log in to the MRS console.
                                                        2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                        3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                          • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                          • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                          @@ -169,7 +180,7 @@

                                                        For clusters of MRS 2.x or earlier:

                                                        1. Log in to the MRS Manager as user admin.
                                                        2. On FusionInsight Manager, choose System Settings and click Configure Password Policy to modify the password policy.
                                                          • Set Password Validity Period (Days) to 0, indicating that the password never expires.
                                                          • Set Password Expiration Notification (Days) to 0.
                                                          • Retain the default values for other parameters.
                                                          -
                                                        3. Choose System > Manage User. On the page displayed, add a dedicated user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                          • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                          +
                                                        4. Choose System > Manage User. On the page displayed, add a dedicated human-machine user as the Kerberos authentication user. Select the user group superGroup for the user, and assign all roles to the user.
                                                          • For clusters of MRS 2.x or earlier, the user must have permissions of the Manager_administrator or System_administrator role to create data connections in Management Center.
                                                          • A user with only the Manager_tenant or Manager_auditor permission cannot create connections.
                                                        5. Log in to MRS Manager as the new user and change the initial password. Otherwise, the connection fails to be created.
                                                        6. Synchronize IAM users.
                                                          1. Log in to the MRS console.
                                                          2. Choose Clusters > Active Clusters, select a running cluster, and click its name to go to its details page.
                                                          3. In the Basic Information area of the Dashboard page, click Synchronize on the right side of IAM User Sync to synchronize IAM users.
                                                            • When the policy of the user group to which the IAM user belongs changes from MRS ReadOnlyAccess to MRS CommonOperations, MRS FullAccess, or MRS Administrator, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD (System Security Services Daemon) cache of cluster nodes needs time to be updated. Then, submit a job. Otherwise, the job may fail to be submitted.
                                                            • When the policy of the user group to which the IAM user belongs changes from MRS CommonOperations, MRS FullAccess, or MRS Administrator to MRS ReadOnlyAccess, wait for 5 minutes until the new policy takes effect after the synchronization is complete because the SSSD cache of cluster nodes needs time to be updated.
                                                            @@ -179,7 +190,7 @@
                                                      diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1436.html b/docs/dataartsstudio/umn/dataartsstudio_01_1436.html index afbce07f3..9f8b8885c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1436.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1436.html @@ -5,7 +5,7 @@

                                                      For details about how to develop a batch processing job in single-task mode, see sections Developing an SQL Script, Configuring job parameters, Data Table, Testing and Saving the Job, and Downloading or Dumping a Script Execution Result.

                                                      Prerequisites

                                                      • A job has been created. For details, see Creating a Job.
                                                      • You have locked the job. Otherwise, you must click Lock so that you can develop the job. A job you create or import is locked by you by default. For details, see the lock function.
                                                      -

                                                      Developing an SQL Script

                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                      3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                      4. In the job directory, double-click the name of a single-task job to access the job development page.
                                                      5. On the right of the SQL editor, click Basic Info to configure basic information, properties, and advanced settings of the job. Table 1 lists the basic information, Table 2 lists the properties, and Table 3 lists the advanced settings. +

                                                        Developing an SQL Script

                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                        3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                        4. In the job directory, double-click the name of a single-task job to access the job development page.
                                                        5. On the right of the SQL editor, click Basic Info to configure basic information, properties, and advanced settings of the job. Table 1 lists the basic information, Table 2 lists the properties, and Table 3 lists the advanced settings.
                                                          @@ -57,11 +59,16 @@

                                                          Click Add to add a tag to the job. You can also select a tag configured in Managing Job Tags.

                                                          + + +
                                                          Table 1 Basic job information

                                                          Parameter

                                                          Description

                                                          @@ -21,6 +21,8 @@

                                                          This parameter is available when Scheduling Identities is set to Yes.

                                                          User that executes the job. When you enter an executor, the job is executed by the executor. If the executor is left unspecified, the job is executed by the user who submitted the job for startup.

                                                          +
                                                          NOTE:

                                                          You can configure execution users only after you apply for the whitelist membership. To enable it, contact customer service or technical support.

                                                          +

                                                          Job Agency

                                                          @@ -42,7 +44,7 @@

                                                          Exclude Waiting Time from Instance Timeout Duration

                                                          Whether to exclude the wait time from the instance execution timeout duration

                                                          -

                                                          If you select this option, the time to wait before an instance starts running is excluded from the timeout duration. You can modify this setting on the Default Configuration page.

                                                          +

                                                          If you select this option, the time to wait before an instance starts running is excluded from the timeout duration. You can modify this setting in Default Configuration > Exclude Waiting Time from Instance Timeout Duration.

                                                          If you do not select this option, the time to wait before an instance starts running is included in the timeout duration.

                                                          Job Description

                                                          +

                                                          Description of the job

                                                          +
                                                          -
                                                          @@ -250,9 +294,9 @@
                                                        6. Enter one or more SQL statements in the SQL editor.
                                                          • SQL statements are separated by semicolons (;). If semicolons are used in other places but not used to separate SQL statements, escape them with backslashes (\). The following is an example:
                                                            select 1;
                                                             select * from a where b="dsfa\;";  --example 1\;example 2.
                                                            -
                                                          • RDS SQL does not support the begin ... commit transaction syntax. If necessary, use the start transaction ... commit transaction syntax.
                                                          • The script cannot be larger than 16 MB.
                                                          • The system date obtained by using an SQL statement is different from that obtained by using the database tool. The query result is stored in the database in the YYYY-MM-DD format, but the query result displayed on the page is in the converted format.
                                                          • When a user submits a Spark SQL script to MRS, the script is submitted to the tenant queue bound to the user by default. The bound queue is the queue corresponding to tenant role of the user. If there are multiple queues, the system preferentially selects a queue based on the queue priorities. To set a fixed queue for the user to submit scripts, log in to FusionInsight Manager, choose Tenant Resources > Dynamic Resource Plan, and click the Global User Policy tab. For details, see "Managing Global User Policies" in MapReduce Service (MRS) Usage Guide.
                                                          +
                                                        7. RDS SQL does not support the begin ... commit transaction syntax. If necessary, use the start transaction ... commit transaction syntax.
                                                        8. The script cannot be larger than 16 MB.
                                                        9. The system date obtained by using an SQL statement is different from that obtained by using the database tool. The query result is stored in the database in the YYYY-MM-DD format, but the query result displayed on the page is in the converted format.
                                                        10. When a user submits a Spark SQL script to MRS, the script is submitted to the tenant queue bound to the user by default. The bound queue is the queue corresponding to tenant role of the user. If there are multiple queues, the system preferentially selects a queue based on the queue priorities. To set a fixed queue for the user to submit scripts, log in to FusionInsight Manager, choose Tenant Resources > Dynamic Resource Plan, and click the Global User Policy tab. For details, see "Managing Global User Policies" in MapReduce Service (MRS) Usage Guide.
                                                        11. You can click Check Syntax to check the syntax of a Spark SQL or Hive SQL script. After the check is complete, you can view the check result in the lower part of the page.
                                                        12. -
                                                          To facilitate script development, DataArts Factory provides the following capabilities:
                                                          • The script editor supports the following shortcut keys, which improve the script development efficiency:
                                                            • F8: Run a script.
                                                            • F9: Stop running a script.
                                                            • Ctrl + /: Comment out or uncomment the line or code block at the cursor.
                                                            • Ctrl +Z: Cancel
                                                            • Ctrl + F: Search
                                                            • Ctrl + Shift + R: Replace
                                                            • Ctrl + X: Cut
                                                            • Ctrl + S: Save a script.
                                                            • Alt + mouse dragging: Select columns to edit a block.
                                                            • Ctrl + mouse click: Select multiple lines to edit or indent them together.
                                                            • Shift + Ctrl + K: Delete the current line.
                                                            • Ctrl + (or ): Move the cursor rightwards (or leftwards) by word.
                                                            • Ctrl + Home or Ctrl + End: Navigate to the beginning or end of the current file.
                                                            • Home or End: Navigate to the beginning or end of the current line.
                                                            • Ctrl + Shift + L: Double-click all the same character strings and add cursors to them to implement batch modification.
                                                            • Ctrl + D: Delete a line.
                                                            • Shift + Ctrl + U: Unlock a script.
                                                            • Ctrl + Alt + K: Select the word where the cursor resides.
                                                            • Ctrl + B: Format
                                                            • Ctrl + Shift + Z: Redo
                                                            • Ctrl + Enter: Execute the selected line or content.
                                                            • Ctrl + Alt + F: Flag
                                                            • Ctrl + Shift + K: Search for the previous one.
                                                            • Ctrl + K: Search for the next one.
                                                            • Ctrl + Backspace: Delete the word to the left of the cursor.
                                                            • Ctrl + Delete: Delete the word to the right of the cursor.
                                                            • Alt + Backspace: Delete all content from the beginning of the line to the cursor.
                                                            • Alt + Delete: Delete all content from the cursor to the end of the line.
                                                            • Alt + Shift-Left: Select all content from the beginning of the line to the cursor.
                                                            • Alt + Shift-Right: Select all content from the cursor to the end of the line.
                                                            +
                                                            To facilitate script development, DataArts Factory provides the following capabilities:
                                                            • The script editor supports the following shortcut keys, which improve the script development efficiency:
                                                              • F8: Run a script.
                                                              • F9: Stop running a script.
                                                              • Ctrl + /: Comment out or uncomment the line or code block at the cursor.
                                                              • Ctrl +Z: Cancel
                                                              • Ctrl + F: Search
                                                              • Ctrl + Shift + R: Replace
                                                              • Ctrl + X: Cut
                                                              • Ctrl + S: Save a script.
                                                              • Alt + mouse dragging: Select columns to edit a block.
                                                              • Ctrl + mouse click: Select multiple lines to edit or indent them together.
                                                              • Ctrl + (or ): Move the cursor rightwards (or leftwards) by word.
                                                              • Ctrl + Home or Ctrl + End: Navigate to the beginning or end of the current file.
                                                              • Home or End: Navigate to the beginning or end of the current line.
                                                              • Ctrl + Shift + L: Double-click all the same character strings and add cursors to them to implement batch modification.
                                                              • Ctrl + D: Delete a line.
                                                              • Shift + Ctrl + U: Unlock a script.
                                                              • Ctrl + Alt + K: Select the word where the cursor resides.
                                                              • Ctrl + B: Format
                                                              • Ctrl + Shift + Z: Redo
                                                              • Ctrl + Enter: Execute the selected line or content.
                                                              • Ctrl + Alt + F: Flag
                                                              • Ctrl + Shift + K: Search for the previous one.
                                                              • Ctrl + K: Search for the next one.
                                                              • Ctrl + Backspace: Delete the word to the left of the cursor.
                                                              • Ctrl + Delete: Delete the word to the right of the cursor.
                                                              • Alt + Backspace: Delete all content from the beginning of the line to the cursor.
                                                              • Alt + Delete: Delete all content from the cursor to the end of the line.
                                                              • Alt + Shift-Left: Select all content from the beginning of the line to the cursor.
                                                              • Alt + Shift-Right: Select all content from the cursor to the end of the line.
                                                            • System functions

                                                              To view the functions supported by this type of data connection, click System Functions on the right of the editor. You can double-click a function to the editor to use it.

                                                            • Script parameters

                                                              Enter script parameters in the SQL statement and click Parameter Setup in the right pane of the editor and then click Update from Script. You can also directly configure parameters and constants for the job script.

                                                              In the following script example, str1 indicates the parameter name. It can contain only letters, digits, hyphens (-), underscores (_), greater-than signs (>), and less-than signs (<), and can contain a maximum of 16 characters. The parameter name must be unique.

                                                              @@ -260,82 +304,81 @@ select * from a where b="dsfa\;"; --example 1\;example 2.
                                                            • Visualized reading of data tables to generate SQL statements

                                                              Click Data Tables on the right of the editor to display all the tables in the current database or schema. You can select tables and columns and click Generate SQL Statement in the lower right corner to generate an SQL statement, which you need to manually format.

                                                            -
                                                          • (Optional) In the upper part of the editor, click Format to format SQL statements.
                                                          • In the upper part of the editor, click Execute. If you need to execute some SQL statements separately, select the SQL statements first. After executing the SQL statements, view the execution history and result of the script in the lower part of the editor.

                                                            You can click View Log to view logs of the job.

                                                            +
                                                          • (Optional) In the upper part of the editor, click Format to format SQL statements.
                                                          • In the upper part of the editor, click Execute. If you need to execute some SQL statements separately, select the SQL statements first. After executing the SQL statements, view the execution history and result of the script in the lower part of the editor.
                                                            • You can click View Log to view logs of the job.
                                                            • When viewing the script execution result, you can double-click a field in any row to view the result details. You can copy the field name.
                                                            • You can control display of the script execution history by setting Script Execution History in Default Configuration to Myself or All users.
                                                            -
                                                          • Above the editor, click to save the job.
                                                          • +
                                                          • Above the editor, click Save to save the job.
                                                          -

                                                          Configuring job parameters

                                                          Job parameters can be globally used in any node in jobs. The procedure is as follows:

                                                          -

                                                          Click Parameter Setup on the right of the editor and set the parameters described in Table 4.

                                                          +

                                                          Configuring job parameters

                                                          Click Parameter Setup on the right of the editor and set the parameters described in Table 4.

                                                          -
                                                          Table 2 Properties of a single-task job

                                                          Property

                                                          +
                                                          @@ -70,28 +77,36 @@ + + + - - - + + + - - + + + + + + + + + + +
                                                          Table 2 Attributes of a batch processing single-task SQL job

                                                          Property

                                                          Description

                                                          DLI SQL properties

                                                          DLI Data Directory

                                                          +

                                                          Select the DLI data directory.

                                                          +
                                                          • Default DLI data directory dli
                                                          • Metadata catalog that has been created in LakeFormation associated with DLI.
                                                          +

                                                          Database Name

                                                          Select a database.

                                                          +

                                                          If you select the default DLI data directory dli, select a DLI database and tables.

                                                          +

                                                          If you select a metadata catalog that has been created in LakeFormation associated with DLI, select a LakeFormation database and tables.

                                                          Queue Name

                                                          The queue set in the SQL script is selected by default. You can change another one.

                                                          -
                                                          You can create a resource queue using either of the following methods:
                                                          • Click . On the displayed Queue Management page of DLI, create a resource queue.
                                                          • Go to the DLI console to create a resource queue.
                                                          +
                                                          You can create a resource queue using either of the following methods:
                                                          • Click . On the displayed Queue Management page of DLI, create a resource queue.
                                                          • Go to the DLI console to create a resource queue.

                                                          Record Dirty Data

                                                          Click to specify whether to record dirty data.

                                                          -
                                                          • If you select , dirty data will be recorded.
                                                          • If you do not select , dirty data will not be recorded.
                                                          +

                                                          Click to specify whether to record dirty data.

                                                          +
                                                          • If you select , dirty data will be recorded.
                                                          • If you do not select , dirty data will not be recorded.

                                                          DLI Environmental Variable

                                                          • The environment variable must start with dli.sql. or spark.sql.
                                                          • If the key of the environment variable is dli.sql.shuffle.partitions or dli.sql.autoBroadcastJoinThreshold, the environment variable cannot contain the greater than (>) or less than (<) sign.
                                                          • If a parameter with the same name is configured in both a job and a script, the parameter value configured in the job will overwrite that configured in the script.
                                                            NOTE:

                                                            When you run a DLI SQL script or test a DLI SQL single-task job in non-scheduling scenarios, the following parameters are enabled by default:

                                                            -
                                                            • spark.sql.adaptive.enabled: Adaptive Query Execution (AQE) is enabled so that Spark can dynamically optimize the query execution plan based on the characteristics of the data being processed and improve the performance by reducing the amount of data to be processed.
                                                            • spark.sql.adaptive.join.enabled: AQE is enabled for join operations. The optimal join algorithm is selected based on the data being processed to improve performance.
                                                            • spark.sql.adaptive.skewedJoin.enabled: AQE is enabled for skewed join operations. Skewed data can be automatically detected and the join algorithm is optimized accordingly to improve performance.
                                                            • spark.sql.mergeSmallFiles.enabled: Merging of small files is enabled. Small files can be merged into large ones, improving performance and shortening the processing time. In addition, less files need to be read from remote storage, and more local files can be used.
                                                            +
                                                          • The environment variable must start with hoodie., dli.sql., dli.ext., dli.jobs., spark.sql., or spark.scheduler.pool.
                                                          • If the environment variable is dli.sql.autoBroadcastJoinThreshold, the value must be an integer. If the environment variable is dli.sql.shuffle.partitions, the value must be a positive integer.
                                                          • If the key of the environment variable is dli.sql.shuffle.partitions or dli.sql.autoBroadcastJoinThreshold, the environment variable cannot contain the greater than (>) or less than (<) sign.
                                                          • If a parameter with the same name is configured in both a job and a script, the parameter value configured in the job will overwrite that configured in the script.
                                                            NOTE:

                                                            When you run a DLI SQL script or test a DLI SQL single-task job in non-scheduling scenarios, the following parameters are enabled by default:

                                                            +
                                                            • spark.sql.adaptive.enabled: Adaptive Query Execution (AQE) is enabled so that Spark can dynamically optimize the query execution plan based on the characteristics of the data being processed and improve the performance by reducing the amount of data to be processed.
                                                            • spark.sql.adaptive.join.enabled: AQE is enabled for join operations. The optimal join algorithm is selected based on the data being processed to improve performance.
                                                            • spark.sql.adaptive.skewedJoin.enabled: AQE is enabled for skewed join operations. Skewed data can be automatically detected and the join algorithm is optimized accordingly to improve performance.
                                                            • spark.sql.mergeSmallFiles.enabled: Merging of small files is enabled. Small files can be merged into large ones, improving performance and shortening the processing time. In addition, fewer files need to be read from remote storage, and more local files can be used.

                                                            If you do not want to use these functions, you can set the values of the preceding parameters to false.

                                                          @@ -144,8 +159,10 @@

                                                          MRS Job Name

                                                          MRS job name.

                                                          -

                                                          If the MRS job name is not set and the direct connection mode is selected, the node name can contain only letters, digits, hyphens (-), and underscores (_).

                                                          +

                                                          MRS job name. The system automatically sets this parameter based on the job name.

                                                          +

                                                          If the MRS job name is not set and the direct connection mode is selected, the node name can contain only letters, digits, hyphens (-), and underscores (_). A maximum of 64 characters are allowed, and Chinese characters are not allowed.

                                                          +
                                                          NOTE:

                                                          If you select an MRS API data connection, you cannot set the job name.

                                                          +

                                                          Data Connection

                                                          @@ -153,9 +170,17 @@

                                                          Select a data connection.

                                                          MRS Resource Queue

                                                          +

                                                          Select a created MRS resource queue.

                                                          +

                                                          This parameter is mandatory if Whether MRS Resource Queue Is Mandatory is set to Yes.

                                                          +
                                                          NOTE:

                                                          Select a queue you configured in the queue permissions of DataArts Security. If you set multiple resource queues for this node, the resource queue you select here has the highest priority.

                                                          +
                                                          +

                                                          Database

                                                          Select a database.

                                                          +

                                                          Select a database. If you select an MRS API connection, you cannot select a database.

                                                          Program Parameter

                                                          @@ -173,8 +198,8 @@

                                                          MRS Job Name

                                                          MRS job name.

                                                          -

                                                          If the MRS job name is not set and the direct connection mode is selected, the node name can contain only letters, digits, hyphens (-), and underscores (_).

                                                          +

                                                          MRS job name. The system automatically sets this parameter based on the job name.

                                                          +

                                                          If the MRS job name is not set and the direct connection mode is selected, the node name can contain only letters, digits, hyphens (-), and underscores (_). A maximum of 64 characters are allowed, and Chinese characters are not allowed.

                                                          Data Connection

                                                          @@ -187,6 +212,12 @@

                                                          Select a database.

                                                          MRS Resource Queue

                                                          +

                                                          Select a created MRS resource queue.

                                                          +

                                                          This parameter is mandatory if Whether MRS Resource Queue Is Mandatory is set to Yes.

                                                          +

                                                          Program Parameter

                                                          Set program parameters.

                                                          @@ -197,6 +228,19 @@

                                                          Doris SQL properties

                                                          +

                                                          Data Connection

                                                          +

                                                          Select a data connection.

                                                          +

                                                          Database

                                                          +

                                                          Select a database.

                                                          +
                                                          @@ -242,7 +286,7 @@

                                                          Yes

                                                          Policy for handling subsequent nodes if the current node fails

                                                          -
                                                          • End the current job execution plan: Execution of the current job will stop, and the job instance status will become Failed.
                                                          • Ignore the failure and set the job execution result to success: The failure of the current node will be ignored, and the next node will be executed. The job instance status will become Successful.
                                                          +
                                                          • End the current job execution plan: Execution of the current job will stop, and the job instance status will become Failed. If the job is scheduled periodically, subsequent periodic scheduling will run properly.
                                                          • Ignore the failure and set the job execution result to success: The failure of the current node will be ignored. The job instance status will become Successful. If the job is scheduled periodically, subsequent periodic scheduling will run properly.
                                                          Table 4 Job parameter setup

                                                          Module

                                                          +
                                                          - - - - - - - - - - - - - - - - - - - - - - - @@ -343,40 +386,40 @@ select * from a where b="dsfa\;"; --example 1\;example 2.

                                                          Click the Parameter Preview tab and configure the parameters listed in Table 5.

                                                          -
                                                          Table 4 Job parameter setup

                                                          Module

                                                          Description

                                                          +

                                                          Description

                                                          Variables

                                                          +

                                                          Variables

                                                          Add

                                                          +

                                                          Add

                                                          Click Add and enter the variable parameter name and parameter value in the text boxes.

                                                          -
                                                          • Parameter

                                                            Only letters, numbers, hyphens, and underscores (_) are allowed.

                                                            -
                                                          • Parameter Value
                                                            • The string type of parameter value is a character string, for example, str1.
                                                            • The numeric type of parameter value is a number or operation expression.
                                                            +

                                                          Click Add and enter the variable parameter name and parameter value in the text boxes.

                                                          +
                                                          • Parameter

                                                            Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                            +
                                                          • Parameter Value
                                                            • The string type of parameter value is a character string, for example, str1.
                                                            • The numeric type of parameter value is a number or operation expression.
                                                          -

                                                          After the parameter is configured, it is referenced in the format of ${parameter name} in the job.

                                                          +

                                                          After the parameter is configured, it is referenced in the format of ${Parameter name} in the job.

                                                          Edit Parameter Expression

                                                          +

                                                          Edit Parameter Expression

                                                          Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                          +

                                                          Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                          Modifying a Job

                                                          +

                                                          Modifying a Job

                                                          Change the parameter name or value in the corresponding text boxes.

                                                          +

                                                          Change the parameter name or value in the corresponding text boxes.

                                                          Mask

                                                          +

                                                          Mask

                                                          If the parameter value is a key, click to mask the value for security purposes.

                                                          +

                                                          If the parameter value is a key, click to mask the value for security purposes.

                                                          Delete

                                                          +

                                                          Delete

                                                          Click next to the parameter name and value text boxes to delete the job parameter.

                                                          +

                                                          Click next to the parameter name and value text boxes to delete the job parameter.

                                                          Constant Parameter

                                                          +

                                                          Constant Parameter

                                                          Add

                                                          +

                                                          Add

                                                          Click Add and enter the constant parameter name and parameter value in the text boxes.

                                                          -
                                                          • Parameter

                                                            Only letters, numbers, hyphens, and underscores (_) are allowed.

                                                            -
                                                          • Parameter Value
                                                            • The string type of parameter value is a character string, for example, str1.
                                                            • The numeric type of parameter value is a number or operation expression.
                                                            +

                                                          Click Add and enter the constant parameter name and parameter value in the text boxes.

                                                          +
                                                          • Parameter

                                                            Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                            +
                                                          • Parameter Value
                                                            • The string type of parameter value is a character string, for example, str1.
                                                            • The numeric type of parameter value is a number or operation expression.
                                                          -

                                                          After the parameter is configured, it is referenced in the format of ${parameter name} in the job.

                                                          +

                                                          After the parameter is configured, it is referenced in the format of ${Parameter name} in the job.

                                                          Edit Parameter Expression

                                                          +

                                                          Edit Parameter Expression

                                                          Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                          +

                                                          Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                          Modifying a Job

                                                          +

                                                          Modifying a Job

                                                          Modify the parameter name and parameter value in text boxes and save the modifications.

                                                          +

                                                          Modify the parameter name and parameter value in text boxes and save the modifications.

                                                          Delete

                                                          +

                                                          Delete

                                                          Click next to the parameter name and value text boxes to delete the job parameter.

                                                          +

                                                          Click next to the parameter name and value text boxes to delete the job parameter.

                                                          Workspace Environment Variables

                                                          +

                                                          Workspace Environment Variables

                                                          View the variables and constants that have been configured in the workspace.

                                                          +

                                                          View the variables and constants that have been configured in the workspace.

                                                          - - @@ -482,7 +548,7 @@ select * from a where b="dsfa\;"; --example 1\;example 2. - @@ -491,16 +557,16 @@ select * from a where b="dsfa\;"; --example 1\;example 2. - - - @@ -509,7 +575,7 @@ select * from a where b="dsfa\;"; --example 1\;example 2. - @@ -518,16 +584,38 @@ select * from a where b="dsfa\;"; --example 1\;example 2. - + + + + +
                                                          Table 5 Job parameter preview

                                                          Module

                                                          +
                                                          - - - - - - - - - - - - - @@ -388,17 +431,17 @@ select * from a where b="dsfa\;"; --example 1\;example 2.

                                                          If a parameter depends on the data generated during job execution, such data cannot be simulated and displayed in Parameter Preview.

                                                          -

                                                          Data Table

                                                          You can view tables of Hive SQL, DLI SQL, RDS SQL, and DWS SQLsingle-task batch processing jobs. On the Data Tables slide-out panel, you can select a table name to view the column names, field types, and descriptions in the table.

                                                          -
                                                          Figure 1 Viewing a data table
                                                          +

                                                          Data Table

                                                          You can view tables of Hive SQL, Spark SQL, DLI SQL, Doris SQL, RDS SQL, and DWS SQLsingle-task batch processing jobs. On the Data Tables slide-out panel, you can select a table name to view the column names, field types, and descriptions in the table.

                                                          +
                                                          Figure 1 Viewing a data table

                                                          Testing and Saving the Job

                                                          After configuring the job, perform the following operations:

                                                          -
                                                          1. Click to execute the job.

                                                            You can view the run logs of the job by clicking View Log.

                                                            +
                                                            1. Click to execute the job.

                                                              You can view the run logs of the job by clicking View Log.

                                                              -

                                                            2. After the job is executed, click to save the job configuration.

                                                              After the job is saved, a version is automatically generated and displayed in Versions. The version can be rolled back. If you save a job multiple times within a minute, only one version is recorded. If the intermediate data is important, you can click Save new version to save and add a version.

                                                              +

                                                            3. After the job is executed, click to save the job configuration.

                                                              After the job is saved, a version is automatically generated and displayed in Versions. The version can be rolled back. If you save a job multiple times within a minute, only one version is recorded. If the intermediate data is important, you can click Save new version to save and add a version.

                                                            -

                                                            Downloading or Dumping Script Execution Results

                                                            After a script is executed successfully, you can download or dump the execution result. By default, all users can download and dump the execution results of SQL scripts. If you do not want all users to have this permission, configure the permission by referring to Configuring a Data Export Policy.
                                                            • After executing a script, you can click Download on the Result tab page to download a CSV result file to a local path. You can view the download record on the Download Center page.
                                                            • After executing a script, you can click Dump on the Result tab page to dump a CSV and a JSON result file to OBS. For details, see Table 6.
                                                              • The dump function is supported only if the OBS service is available.
                                                              • Only the execution results of the query statements in SQL scripts can be dumped.
                                                              +

                                                              Downloading or Dumping Script Execution Results

                                                              After a script is executed successfully, you can download or dump the execution result. By default, all users can download and dump the execution results of SQL scripts. If you do not want all users to have this permission, configure the permission by referring to Configuring a Data Export Policy.
                                                              • After executing a script, you can click Download on the Result tab page to download a CSV result file to a local path. You can view the download record on the Download Center page.
                                                              • After executing a script, you can click Dump on the Result tab page to dump a CSV and a JSON result file to OBS. For details, see Table 6.
                                                                • The dump function is supported only if the OBS service is available.
                                                                • Only the execution results of SQL script query statements can be dumped.
                                                                • If the execution result of a download or dump SQL statement contains commas (,), newline characters, or other special characters, data may be disordered, the number of rows may increase, or other issues may occur.
                                                          Table 5 Job parameter preview

                                                          Module

                                                          Description

                                                          +

                                                          Description

                                                          Current Time

                                                          +

                                                          Current Time

                                                          This parameter is displayed only when Scheduling Type is set to Run once. The default value is the current time.

                                                          +

                                                          This parameter is displayed only when Scheduling Type is set to Run once. The default value is the current time.

                                                          Event Triggering Time

                                                          +

                                                          Event Triggering Time

                                                          This parameter is displayed only when Scheduling Type is set to Event-based. The default value is the time when an event is triggered.

                                                          +

                                                          This parameter is displayed only when Scheduling Type is set to Event-based. The default value is the time when an event is triggered.

                                                          Scheduling Period

                                                          +

                                                          Scheduling Period

                                                          This parameter is displayed only when Scheduling Type is set to Run periodically. The default value is the scheduling period.

                                                          +

                                                          This parameter is displayed only when Scheduling Type is set to Run periodically. The default value is the scheduling period.

                                                          Start Time

                                                          +

                                                          Start Time

                                                          This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the configured job execution time.

                                                          +

                                                          This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the configured job execution time.

                                                          Start Time

                                                          +

                                                          Start Time

                                                          This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the time when the periodic job scheduling starts.

                                                          +

                                                          This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the time when the periodic job scheduling starts.

                                                          Subsequent Instances

                                                          +

                                                          Subsequent Instances

                                                          Number of job instances scheduled.

                                                          +

                                                          Number of job instances scheduled.

                                                          • The default value is 1 when Scheduling Type is set to Run once.
                                                          • The default value is 1 when Scheduling Type is set to Event-based.
                                                          • When Scheduling Type is set to Run periodically:

                                                            If the number of instances exceeds 10, a maximum of 10 instances can be displayed, and the system displays message "A maximum of 10 instances are supported."

                                                          + + + + + + + +
                                                          Table 6 Dump parameters

                                                          Parameter

                                                          @@ -462,6 +505,29 @@ select * from a where b="dsfa\;"; --example 1\;example 2.
                                                          • UTF-8: default character set
                                                          • GB2312: recommended when the data to be exported contains Chinese character sets
                                                          • GBK: expanded based on and compatible with GB2312

                                                          Quotation Character

                                                          +

                                                          No

                                                          +

                                                          This parameter is available and can be set only when Data Format is csv.

                                                          +

                                                          Quotation characters are used to identify the beginning and end of text fields when exporting job results, and are used to separate fields.

                                                          +

                                                          Only one character can be set. The default value is double quotation marks (").

                                                          +

                                                          This is mainly used to handle data that contains spaces, special characters, or characters that are the same as the delimiter.

                                                          +

                                                          For details about the examples of using quotation characters and escape characters, see Example of Using Quotation Characters and Escape Characters.

                                                          +

                                                          Escape Character

                                                          +

                                                          No

                                                          +

                                                          This parameter is available and can be set only when Data Format is csv.

                                                          +

                                                          If special characters, such as quotation marks, need to be included in the exported results, they can be represented using escape characters (backslash \).

                                                          +

                                                          Only one character can be set. The default value is a backslash (\).

                                                          +

                                                          Common scenarios for using escape characters are:

                                                          +
                                                          • If there is a third quotation mark between two quotation marks, add an escape character before the third quotation mark to prevent the field content from being split.
                                                          • If there is already an escape character in the data content, add another escape character before the existing one to avoid the original character being used as an escape character.
                                                          +

                                                          For details about the examples of using quotation characters and escape characters, see Example of Using Quotation Characters and Escape Characters.

                                                          +
                                                          @@ -472,9 +538,9 @@ select * from a where b="dsfa\;"; --example 1\;example 2.

                                                          Maximum Number of Results That You Can View Online

                                                          Maximum Number of Results That You Can Download

                                                          +

                                                          Maximum Number/Size of Results That Can Be Downloaded

                                                          Maximum Number of Results That You Can Dump

                                                          +

                                                          Maximum Number/Size of Results That Can Be Dumped

                                                          1,000

                                                          1,000

                                                          +

                                                          1,000 records, less than 3MB

                                                          Unlimited

                                                          1,000

                                                          1,000

                                                          +

                                                          1,000 records, less than 3MB

                                                          10,000 records or 3 MB

                                                          DWS

                                                          +

                                                          GaussDB(DWS)

                                                          1,000

                                                          1,000

                                                          +

                                                          1,000 records, less than 3MB

                                                          10,000 records or 3 MB

                                                          1,000

                                                          1,000

                                                          +

                                                          1,000 records, less than 3MB

                                                          10,000 records or 3 MB

                                                          1,000

                                                          1,000

                                                          +

                                                          1,000 records, less than 3MB

                                                          Not supported

                                                          Doris

                                                          +

                                                          1,000

                                                          +

                                                          1,000 records, less than 3MB

                                                          +

                                                          1,000 records or 3 MB

                                                          +
                                                          +

                                                          Example of Using Quotation Characters and Escape Characters

                                                          • Usage of quotation characters and escape characters:
                                                            • Quotation character: used to identify and separate fields. The default value is double quotation marks (").
                                                            • Escape character: If special characters, such as quotation marks, need to be included in the exported results, they can be represented using escape characters (backslash \). The default value is a backslash (\).
                                                              1. To prevent the content of a field from being split when there is a third quotation character between two quotation characters, add an escape character before the third quotation character.
                                                              2. If there is already an escape character in the data content, add another escape character before the existing one to avoid the original character being used as an escape character.
                                                              +
                                                            +
                                                          • Example:

                                                            +

                                                            +

                                                            You can leave Quotation Character and Escape Character empty.

                                                            +

                                                            +

                                                            +

                                                            If you leave them empty, the downloaded .csv file contains two rows in Excel.

                                                            +

                                                            +

                                                            If you specify both of them, for example, enter double quotation marks ("), the downloaded file is as follows.

                                                            +

                                                            +
                                                          +
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1509.html b/docs/dataartsstudio/umn/dataartsstudio_01_1509.html new file mode 100644 index 000000000..d640f4f00 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1509.html @@ -0,0 +1,120 @@ + + +

                                                          Redis Connection Parameters

                                                          +
                                                          +
                                                          + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                          Table 1 Redis connection

                                                          Parameter

                                                          +

                                                          Mandatory

                                                          +

                                                          Description

                                                          +

                                                          Data Connection Type

                                                          +

                                                          Yes

                                                          +

                                                          Redis is selected by default and cannot be changed.

                                                          +

                                                          Name

                                                          +

                                                          Yes

                                                          +

                                                          Name of the data connection to create. Data connection names can contain a maximum of 100 characters. They can contain only letters, digits, underscores (_), and hyphens (-).

                                                          +

                                                          Tag

                                                          +

                                                          No

                                                          +
                                                          Attribute of the data connection to create. Tags make management easier.
                                                          NOTE:

                                                          The tag name can contain only letters, digits, and underscores (_) and cannot start with an underscore (_) or contain more than 100 characters.

                                                          +
                                                          +
                                                          +

                                                          Applicable Modules

                                                          +

                                                          Yes

                                                          +

                                                          Select the modules for which this connection is available.

                                                          +

                                                          Basic and Network Connectivity Configuration

                                                          +

                                                          Manual

                                                          +

                                                          No

                                                          +

                                                          This parameter is available when a proxy is used for connection. You can select Cluster Name Mode or Connection String Mode.

                                                          +
                                                          • If you select Cluster Name Mode, select an existing cluster.
                                                          • If you select Connection String Mode, enter the IP address and port of the corresponding cluster.
                                                          +

                                                          MRS Cluster Name

                                                          +

                                                          Yes

                                                          +
                                                          The name of the MRS cluster. Select an MRS cluster that Hive belongs to. Only MRS clusters are supported. A Hadoop cluster can be selected only after it is managed by MRS. All the MRS clusters with the same project ID and enterprise project are displayed.
                                                          NOTE:

                                                          DataArts Studio does not support MRS clusters whose Kerberos encryption type is aes256-sha2,aes128-sha2, and only supports MRS clusters whose Kerberos encryption type is aes256-sha1,aes128-sha1.

                                                          +
                                                          +
                                                          +
                                                          If the connection fails after you select a cluster, check whether the MRS cluster can communicate with the CDM instance which functions as the agent. They can communicate with each other in the following scenarios:
                                                          • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in different regions, a public network or a dedicated connection is required. If the Internet is used for communication, ensure that an EIP has been bound to the CDM cluster, and the MRS cluster can access the Internet and the port has been enabled in the firewall rule.
                                                          • If the CDM cluster in the DataArts Studio instance and the MRS cluster are in the same region, VPC, subnet, and security group, they can communicate with each other by default. If they are in the same VPC but in different subnets or security groups, you must configure routing rules and security group rules. For details about how to configure routing rules, see "Adding Routes to a Route Table" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide. For details about how to configure security group rules, see "Security Group" > "Adding a Security Group Rule" in Virtual Private Cloud (VPC) x.x.x User Guide in Virtual Private Cloud (VPC) x.x.x Usage Guide.
                                                          • The MRS cluster and the DataArts Studio workspace belong to the same enterprise project. If they do not, you can modify the enterprise project of the workspace.
                                                          +
                                                          NOTE:

                                                          If an agent is connected to multiple MRS clusters and one of the MRS clusters is deleted or abnormal, connections to the other MRS clusters will be affected. Therefore, you are advised to connect an agent to only one MRS cluster.

                                                          +
                                                          +
                                                          +

                                                          Server List

                                                          +

                                                          Yes

                                                          +

                                                          This parameter is displayed when Manual is set to Connection String Mode.

                                                          +

                                                          One or more servers (server domain name/IP address:server port) separated by commas (,)

                                                          +

                                                          Example: 192.168.0.1:27017 or 192.168.0.2:27017

                                                          +

                                                          KMS Key

                                                          +

                                                          Yes

                                                          +
                                                          KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                          NOTE:
                                                          • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                          • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                          +
                                                          +
                                                          +

                                                          Agent

                                                          +

                                                          Yes

                                                          +

                                                          The CDM cluster provides an agent for communications between DataArts Studio and Redis. When creating a Redis connection, select a CDM cluster. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                          +

                                                          Data Source Authentication and Other Function Configuration

                                                          +

                                                          Authentication Method

                                                          +

                                                          Yes

                                                          +

                                                          This parameter is mandatory when Manual is set to Connection String Mode.

                                                          +

                                                          Select the authentication type of the database.

                                                          +

                                                          The options include SIMPLE and KERBEROS.

                                                          +

                                                          Password

                                                          +

                                                          Yes

                                                          +

                                                          Password for accessing the database. The password is required for creating a cluster.

                                                          +
                                                          +
                                                          +
                                                          + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1510.html b/docs/dataartsstudio/umn/dataartsstudio_01_1510.html new file mode 100644 index 000000000..8abf96d7c --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1510.html @@ -0,0 +1,143 @@ + + +

                                                          SAP HANA Connection Parameters

                                                          +
                                                          +
                                                          + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                          Table 1 SAP HANA connection

                                                          Parameter

                                                          +

                                                          Mandatory

                                                          +

                                                          Description

                                                          +

                                                          Data Connection Type

                                                          +

                                                          Yes

                                                          +

                                                          The value is fixed at RDS(SAP HANA).

                                                          +

                                                          Name

                                                          +

                                                          Yes

                                                          +

                                                          Name of the data connection to create. Data connection names can contain a maximum of 100 characters. They can contain only letters, digits, underscores (_), and hyphens (-).

                                                          +

                                                          Tag

                                                          +

                                                          No

                                                          +
                                                          Attribute of the data connection to create. Tags make management easier.
                                                          NOTE:

                                                          The tag name can contain only letters, digits, and underscores (_) and cannot start with an underscore (_) or contain more than 100 characters.

                                                          +
                                                          +
                                                          +

                                                          Applicable Modules

                                                          +

                                                          Yes

                                                          +

                                                          Select the modules for which this connection is available.

                                                          +

                                                          Basic and Network Connectivity Configuration

                                                          +

                                                          IP Address or Domain Name

                                                          +

                                                          Yes

                                                          +

                                                          Address for accessing the relational database data source. The value can be an IP address or a domain name.

                                                          +
                                                          • If the data source is RDS, you can obtain the address on the management console by performing the following operations:
                                                            1. Log in to the management console of the corresponding cloud service using the account you have obtained.
                                                            2. In the left navigation pane, choose Instances.
                                                            3. Click the name of an instance to enter the basic information page. In the Connection Information area, you can obtain the private IP address, domain name, and port number.
                                                            +
                                                          • If the data source is MySQL, PostgreSQL, or DM, you can obtain the access address from the database administrator.
                                                          +

                                                          Port

                                                          +

                                                          Yes

                                                          +

                                                          Port for accessing the relational database

                                                          +
                                                          • If the data source is RDS, you can obtain the address on the management console by performing the following operations:
                                                            1. Log in to the management console of the corresponding cloud service using the account you have obtained.
                                                            2. In the left navigation pane, choose Instances.
                                                            3. Click the name of an instance to enter the basic information page. In the Connection Information area, you can obtain the private IP address, domain name, and port number.
                                                            +
                                                          • If the data source is MySQL, PostgreSQL, or DM, you can obtain the access address from the database administrator.
                                                          +

                                                          KMS Key

                                                          +

                                                          Yes

                                                          +
                                                          KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                          NOTE:
                                                          • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                          • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                          +
                                                          +
                                                          +

                                                          Agent

                                                          +

                                                          Yes

                                                          +

                                                          DataArts Studio cannot be directly connected to non-fully managed services. A CDM cluster can provide an agent for DataArts Studio to communicate with non-fully-managed services. Therefore, you need to select a CDM cluster when creating an SAP HANA data connection. If no CDM cluster is available, create one first by referring to Creating a CDM Cluster.

                                                          +

                                                          Data Source Driver Configuration

                                                          +

                                                          Driver Name

                                                          +

                                                          Yes

                                                          +

                                                          Driver name

                                                          +
                                                          • com.mysql.jdbc.Driver: Select this driver name for RDS for MySQL or MySQL.
                                                          • org.postgresql.Driver: Select this driver name for RDS for PostgreSQL or PostgreSQL.
                                                          • com.microsoft.sqlserver.jdbc.SQLServerDriver: Select this driver name for RDS for SQL Server.
                                                          +

                                                          Driver Source

                                                          +

                                                          Yes

                                                          +

                                                          Source of the driver file

                                                          +

                                                          Driver File Path

                                                          +

                                                          Yes

                                                          +

                                                          This parameter is mandatory when Driver File Source is set to OBS path.

                                                          +

                                                          It specifies the OBS path where the driver file is located. You need to download a .jar driver file from the corresponding official website and upload it to OBS.

                                                          + +
                                                          NOTE:
                                                          • The OBS path of the driver file cannot contain Chinese characters.
                                                          • To update the driver, you must restart the CDM cluster in DataArts Migration and then edit the data connection to upload the driver.
                                                          +
                                                          +

                                                          Driver File

                                                          +

                                                          Yes

                                                          +

                                                          This parameter is mandatory when Driver Source is set to Local file.

                                                          +

                                                          You can download a driver file from the official driver website, and then click Select and upload the driver. Alternatively, you can select a driver that has been uploaded before.

                                                          +

                                                          Data Source Authentication and Other Function Configuration

                                                          +

                                                          Username

                                                          +

                                                          Yes

                                                          +

                                                          Username of the database. The username is required for creating a cluster.

                                                          +

                                                          Password

                                                          +

                                                          Yes

                                                          +

                                                          Password for accessing the database. The password is required for creating a cluster.

                                                          +
                                                          +
                                                          +
                                                          + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1582.html b/docs/dataartsstudio/umn/dataartsstudio_01_1582.html index b8546dc60..79ad85378 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1582.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1582.html @@ -8,21 +8,22 @@

                                                          Prerequisites

                                                          A template has been created. If no template is available, create one by referring to Configuring a Template.

                                                          -

                                                          Using Templates

                                                          • Use a script template for a Flink SQL script.
                                                            1. In the navigation pane on the DataArts Studio console, choose Data Development > Develop Script.
                                                            2. Right-click a script directory and select Create Flink SQL Script.
                                                            3. Click Template. In the slide-out pane, select a template, for example, 412_mobna. You can select multiple templates.
                                                              Figure 1 Using a script template
                                                              -

                                                              +

                                                              Using Templates

                                                              • Use a script template for a Flink SQL script.
                                                                1. In the navigation pane on the DataArts Studio console, choose Data Development > Develop Script.
                                                                2. Right-click a script directory and select Create Flink SQL Script.
                                                                3. Click Template. In the slide-out pane, select a template, for example, 412_mobna. You can select multiple templates.

                                                                  +
                                                                  Figure 1 Using a script template
                                                                4. Click Save to create the 412_test script.
                                                              • During the development of a pipeline job, use the Flink SQL script which uses a script template for the MRS Flink Job node.
                                                                1. In the navigation pane on the DataArts Factory console, choose Data Development > Develop Job.
                                                                2. Right-click a job directory and select Create Job to create a batch processing job in pipeline mode.
                                                                3. On the displayed data development page, drag an MRS Flink Job node to the canvas.
                                                                4. Select Flink SQL job for Job Type and select the Flink SQL script for Script Path.

                                                                  After the script is selected, the template parameters and values used by the script are automatically displayed.

                                                                  -
                                                                  Figure 2 Using the Flink SQL script
                                                                  +
                                                                  Figure 2 Using the Flink SQL script

                                                                -
                                                              • During the development of a pipeline job, use a parameter template in Program Parameter of the MRS Flink Job node.
                                                                1. Set MRS Cluster.
                                                                2. Program parameters are automatically displayed. Click Select Template and select a parameter template. You can also select multiple templates.
                                                                  The parameter names and values are automatically displayed.
                                                                  Figure 3 Using a parameter template for program parameters
                                                                  +
                                                                3. During the development of a pipeline job, use a parameter template in Program Parameter of the MRS Flink Job node.
                                                                  1. Set MRS Cluster.
                                                                  2. Program parameters are automatically displayed. Click Select Template and select a parameter template. You can also select multiple templates.
                                                                    The parameter names and values are automatically displayed.
                                                                    Figure 3 Using a parameter template for program parameters

                                                                  -
                                                                4. Use a script template in a single-task Flink SQL job.
                                                                  1. In the navigation pane on the DataArts Factory console, choose Data Development > Develop Job.
                                                                  2. Right-click a job directory and select Create Job to create a real-time processing job in single-task Flink SQL mode.
                                                                  3. Click Template. In the slide-out pane, select a template, for example, 412_mobna. You can select multiple templates.
                                                                    Figure 4 Using a script template in a single-task Flink SQL job.
                                                                    -

                                                                    +
                                                                  4. Use a script template in a single-task Flink SQL job.
                                                                    1. In the navigation pane on the DataArts Factory console, choose Data Development > Develop Job.
                                                                    2. Right-click a job directory and select Create Job to create a real-time processing job in single-task Flink SQL mode.
                                                                    3. Click Template. In the slide-out pane, select a template, for example, 412_mobna. You can select multiple templates.

                                                                      +
                                                                      Figure 4 Using a script template in a single-task Flink SQL job
                                                                      +

                                                                    -
                                                                  5. Use template parameters in a single-task Flink JAR job.
                                                                    1. In the navigation pane on the DataArts Factory console, choose Data Development > Develop Job.
                                                                    2. Right-click a job directory and select Create Job to create a real-time processing job in single-task Flink JAR mode.
                                                                    3. Set MRS Cluster.
                                                                    4. Program parameters are automatically displayed. Click Select Template and select a parameter template. You can also select multiple templates.
                                                                      The parameter names and values are automatically displayed.
                                                                      Figure 5 Using a script template in a single-task Flink JAR job.
                                                                      +
                                                                    5. Use template parameters in a single-task Flink JAR job.
                                                                      1. In the navigation pane on the DataArts Factory console, choose Data Development > Develop Job.
                                                                      2. Right-click a job directory and select Create Job to create a real-time processing job in single-task Flink JAR mode.
                                                                      3. Set MRS Cluster.
                                                                      4. Program parameters are automatically displayed. Click Select Template and select a parameter template. You can also select multiple templates.
                                                                        The parameter names and values are automatically displayed.
                                                                        Figure 5 Using a script template in a single-task Flink JAR job.

                                                                      @@ -35,3 +36,10 @@
                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1584.html b/docs/dataartsstudio/umn/dataartsstudio_01_1584.html index 081e2ab97..698d66864 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1584.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1584.html @@ -9,17 +9,17 @@
                                                          1. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                          2. Create an SQL script. This section uses the MRS Spark SQL script as an example.
                                                          3. Select a created data connection and database.
                                                          4. Compile the SQL script to obtain the maximum time data from table1.
                                                            select max(time) from table1
                                                          5. Save and submit the version. The maxtime script is created.

                                                          Creating a Pipeline Subjob

                                                          -
                                                          1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                          2. Select a CDM Job node and configure the node properties.
                                                            Figure 1 Configuring CDM Job node properties
                                                            +
                                                            1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                            2. Select a CDM Job node and configure the node properties.
                                                              Figure 1 Configuring CDM Job node properties

                                                              Select a CDM cluster and associate the node with an existing CDM job.

                                                              Configure the job parameters and add job parameter maxtime.

                                                              -
                                                              Figure 2 Configuring job parameters
                                                              +
                                                              Figure 2 Configuring job parameters

                                                            3. Save and submit the version. The subjob sub is created.

                                                            Creating a Pipeline Job

                                                            -
                                                            1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                            2. Select an MRS Spark SQL node and a For Each node to execute the CDM subjob cyclically.
                                                            3. Configure properties of the MRS Spark SQL node and associate the node with the created maxtime script.
                                                              Figure 3 Configuring properties for the MRS Spark SQL node
                                                              +
                                                              1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                              2. Select an MRS Spark SQL node and a For Each node to execute the CDM subjob cyclically.
                                                              3. Configure properties of the MRS Spark SQL node and associate the node with the created maxtime script.
                                                                Figure 3 Configuring properties for the MRS Spark SQL node

                                                                -
                                                              4. Configure properties of the For Each node and associate the node with the created CDM subjob.
                                                                Figure 4 Configuring properties for the For Each node
                                                                +
                                                              5. Configure properties of the For Each node and associate the node with the created CDM subjob.
                                                                Figure 4 Configuring properties for the For Each node

                                                                After associating the node with the created subjob sub, write a parameter expression.

                                                                #{Loop.current[0]}
                                                                @@ -27,9 +27,9 @@
                                                                #{Job.getNodeOutput("maxtime")}
                                                              6. Save and submit the version. The job is created.

                                                              Obtaining the Maximum Time Value from the CDM Job Using a Where Clause and Transferring the Value to the Destination Job

                                                              -
                                                              1. Open the created subjob.
                                                              2. Click next to the job name to go to the job configuration page.
                                                                Figure 5 Editing the CDM job
                                                                +
                                                                1. Open the created subjob.
                                                                2. Click next to the job name to go to the job configuration page.
                                                                  Figure 5 Editing the CDM job

                                                                  -
                                                                3. In the advanced attributes of the source job configuration, configure a where clause to obtain the data to be migrated. When the job is executed, the migration data obtained from the source will be replicated, exported, and imported to the destination.
                                                                  Figure 6 Configuring a where clause
                                                                  +
                                                                4. In the advanced attributes of the source job configuration, configure a where clause to obtain the data to be migrated. When the job is executed, the migration data obtained from the source will be replicated, exported, and imported to the destination.
                                                                  Figure 6 Configuring a where clause

                                                                  The where clause is as follows:

                                                                  dt > '${maxtime}'
                                                                  @@ -42,3 +42,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1620.html b/docs/dataartsstudio/umn/dataartsstudio_01_1620.html new file mode 100644 index 000000000..4e2880183 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1620.html @@ -0,0 +1,209 @@ + + +

                                                                  Rest Client Connection Parameters

                                                                  +
                                                                  +
                                                                  + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                  Table 1 Rest Client connection

                                                                  Parameter

                                                                  +

                                                                  Mandatory

                                                                  +

                                                                  Description

                                                                  +

                                                                  Data Connection Type

                                                                  +

                                                                  Yes

                                                                  +

                                                                  The value is fixed at Rest Client.

                                                                  +

                                                                  Name

                                                                  +

                                                                  Yes

                                                                  +

                                                                  Name of the data connection to create. Data connection names can contain a maximum of 100 characters. They can contain only letters, digits, underscores (_), and hyphens (-).

                                                                  +

                                                                  Tag

                                                                  +

                                                                  No

                                                                  +
                                                                  Attribute of the data connection to create. Tags make management easier.
                                                                  NOTE:

                                                                  The tag name can contain only letters, digits, and underscores (_) and cannot start with an underscore (_) or contain more than 100 characters.

                                                                  +
                                                                  +
                                                                  +

                                                                  Applicable Modules

                                                                  +

                                                                  Yes

                                                                  +

                                                                  Select the modules for which this connection is available. The connection can be used in the selected modules.

                                                                  +

                                                                  Basic and Network Connectivity Configuration

                                                                  +

                                                                  Connection address prefix

                                                                  +

                                                                  Yes

                                                                  +

                                                                  This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                                                  +

                                                                  Prefix of the connection address. This prefix is automatically added when an API is called during a job test or execution. HTTPS supports only TLS 1.2.

                                                                  +

                                                                  Example: https://xxx.com/prefix

                                                                  +

                                                                  Default Header

                                                                  +

                                                                  Yes

                                                                  +

                                                                  This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                                                  +

                                                                  It specifies the default header parameter. This header is carried when an API is called. Example: {"Content-Type":"application/json"}

                                                                  +

                                                                  KMS Key

                                                                  +

                                                                  Yes

                                                                  +
                                                                  KMS key used to encrypt and decrypt data source authentication information. Select a default or custom key.
                                                                  NOTE:
                                                                  • When you use KMS for encryption through DataArts Studio or KPS for the first time, the default key dlf/default or kps/default is automatically generated. For more information about default keys, see "What Is a Default Master Key?" in Data Encryption Workshop FAQs.
                                                                  • Only symmetric keys are supported. Asymmetric keys are not supported.
                                                                  +
                                                                  +
                                                                  +

                                                                  Agent

                                                                  +

                                                                  Yes

                                                                  +

                                                                  This parameter is displayed when DataArts Migration is selected for Applicable Modules.

                                                                  +

                                                                  DataArts Studio cannot directly connect to non-fully managed services. An agent is required for DataArts Studio to communicate with non-fully managed services. A CDM cluster can function as an agent. If no CDM cluster is available, create one by referring to Creating a CDM Cluster.

                                                                  +

                                                                  Data Source Authentication and Other Function Configuration

                                                                  +

                                                                  Rest auth type

                                                                  +

                                                                  Yes

                                                                  +

                                                                  Authentication method. The following options are available:

                                                                  +
                                                                  • NONE: no authentication
                                                                  • BASIC_AUTH: basic authentication

                                                                    If the data source API supports username and password authentication, you can select this authentication type and configure the username and password used for authentication. When the data source is connected, the username and password are transferred to the RESTful address through the Basic Auth protocol for authentication. The format is {"Authorization":"Basic base64(username:password)"}.

                                                                    +
                                                                  • TOKEN_AUTH: token authentication (The token is static and never expires. Otherwise, jobs will fail if the token expires.)

                                                                    If the data source API supports token-based authentication, you can select this authentication type and set a fixed token for authentication. When the data source is connected, the token is transferred to the header for authentication. The format is {"Authorization":"Bearer <token>"}.

                                                                    +
                                                                  • OAUTH_CODE_GRANT Oauth 2.0 (Authorization Code): Oauth2.0 authentication

                                                                    In this mode, a username and a password are used to obtain an access token, which is used to access APIs.

                                                                    +
                                                                  +

                                                                  Username

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is BASIC_AUTH.

                                                                  +

                                                                  You can use #username to obtain the value and transfer it in the body and header.

                                                                  +

                                                                  Password

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is BASIC_AUTH.

                                                                  +

                                                                  You can use #password to obtain the value and transfer it in the body and header.

                                                                  +

                                                                  Token

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is TOKEN_AUTH.

                                                                  +

                                                                  You can use #token to obtain the value and transfer it in the body and header.

                                                                  +

                                                                  Auth request url

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  This parameter is available when Rest auth type is set to Oauth 2.0 (Authorization Code). This API supports OAuth 2.0. Authentication credentials are used to obtain a token. Before testing connections and jobs, call this API to obtain the token. In addition, the location, name, and value acquisition mode of the token carried in subsequent APIs are defined in the authentication token.

                                                                  +

                                                                  Example: https://xxx.com/auth/token

                                                                  +

                                                                  Auth request method

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  Authentication request method in OAuth 2.0 mode. The value can be GET or POST. This parameter is mandatory if Auth request url is set.

                                                                  +

                                                                  Example: GET

                                                                  +

                                                                  Auth request username

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  This parameter is mandatory for the Oauth 2.0 mode. You can use #authUsername to obtain the value of this parameter and enter it in the authHeader or authbody parameter.

                                                                  +

                                                                  Auth request password

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  This parameter is mandatory for the Oauth 2.0 mode. You can use #authPassword to obtain the value of this parameter and enter it in the authHeader or authbody parameter.

                                                                  +

                                                                  Auth request header

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  Request header for the Oauth 2.0 mode. The authentication account and password can be obtained through #authUsername and #authPassword.

                                                                  +

                                                                  Example: {"username": "#authUsername","password": "#authPassword","Content-Type":"application/json"}

                                                                  +

                                                                  Auth request body

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  Request body for the Oauth 2.0 mode. This parameter is unavailable when Auth request method is set to GET. The authentication account and password can be obtained through #authUsername and #authPassword.

                                                                  +

                                                                  Example: {"username": "#authUsername","password": "#authPassword"}

                                                                  +

                                                                  Auth request token

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  Authentication token, which can be obtained from the response body of the authentication API and carried in the connection and job test. The token can only be placed in the header. The value contains a parameter name and a parameter value. The parameter value can be a SpEL expression.

                                                                  +

                                                                  The following is an example:

                                                                  +

                                                                  The authentication response body is as follows:

                                                                  +

                                                                  {

                                                                  +

                                                                  "code" : 200,

                                                                  +

                                                                  "data" : {

                                                                  +

                                                                  "access_token" : "DSFSDFWE87WE9089W9EW9ER898WER9W89ER8",

                                                                  +

                                                                  "expired":1000

                                                                  +

                                                                  }

                                                                  +

                                                                  }

                                                                  +

                                                                  To obtain the value of access_token in Bearer <token> format, set the value of this parameter as follows:

                                                                  +

                                                                  NAME: Authentication

                                                                  +

                                                                  VALUE: 'Bearer ' + #response.data.access_token

                                                                  +

                                                                  Auth request token expired

                                                                  +

                                                                  No

                                                                  +

                                                                  This parameter is displayed when Rest auth type is OAUTH_CODE_GRANT.

                                                                  +

                                                                  Validity period of the authentication token, in seconds. The value can be an EL expression. The default value 0 indicates that the token is permanently valid.

                                                                  +

                                                                  Example 1: 300 indicates that the validity period is 300 seconds.

                                                                  +

                                                                  Example 2: #response.data.expired. Obtain the value of the expired attribute from the JSON string returned by the authentication API. The default unit is second. If the value is not of the int type, enter a validity period.

                                                                  +
                                                                  +
                                                                  +
                                                                  + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1628.html b/docs/dataartsstudio/umn/dataartsstudio_01_1628.html new file mode 100644 index 000000000..62c2d967d --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1628.html @@ -0,0 +1,128 @@ + + +

                                                                  YASHAN Link Parameters

                                                                  +

                                                                  Table 1 describes the YASHAN link parameters.

                                                                  +

                                                                  Do not change the password or user when the job is running. If you do so, the password will not take effect immediately and the job will fail.

                                                                  +
                                                                  + +
                                                                  + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                  Table 1 YASHAN link parameters

                                                                  Parameter

                                                                  +

                                                                  Description

                                                                  +

                                                                  Example Value

                                                                  +

                                                                  Name

                                                                  +

                                                                  Link name, which should be defined based on the data source type, so it is easier to remember what the link is for

                                                                  +

                                                                  yashan_link

                                                                  +

                                                                  Database Server

                                                                  +

                                                                  IP address or domain name of the database to connect

                                                                  +

                                                                  Click Select next to the text box to obtain the list of instances.

                                                                  +

                                                                  192.168.0.1

                                                                  +

                                                                  Port

                                                                  +

                                                                  Port of the database to connect

                                                                  +

                                                                  1688

                                                                  +

                                                                  Database Name

                                                                  +

                                                                  Name of the database to connect

                                                                  +

                                                                  dbname

                                                                  +

                                                                  Username

                                                                  +

                                                                  Username used for accessing the database This account must have the permissions required to read and write data tables and metadata.

                                                                  +

                                                                  cdm

                                                                  +

                                                                  Password

                                                                  +

                                                                  Password of the user

                                                                  +

                                                                  -

                                                                  +

                                                                  Use Agent

                                                                  +

                                                                  The agent function will be unavailable soon and does not need to be configured.

                                                                  +

                                                                  -

                                                                  +

                                                                  Agent

                                                                  +

                                                                  The agent function will be unavailable soon and does not need to be configured.

                                                                  +

                                                                  -

                                                                  +

                                                                  Reference Sign

                                                                  +

                                                                  (Optional) Delimiter between the names of the referenced tables or columns. For details, see the product documentation of the corresponding database.

                                                                  +

                                                                  "

                                                                  +

                                                                  Driver Version

                                                                  +

                                                                  Different types of relational databases adapt to different drivers. For details, see How Do I Obtain a Driver?

                                                                  +

                                                                  -

                                                                  +

                                                                  Fetch Size

                                                                  +

                                                                  (Optional) Displayed when you click Show Advanced Attributes.

                                                                  +

                                                                  Number of rows obtained by each request. Set this parameter based on the data source and the job's data size. If the value is too large or too small, the job execution time may be affected.

                                                                  +

                                                                  1000

                                                                  +

                                                                  SSL Encryption

                                                                  +

                                                                  (Optional) Displayed when you click Show Advanced Attributes.

                                                                  +

                                                                  Select Yes if you want to enable SSL encrypted transmission.

                                                                  +

                                                                  Yes

                                                                  +

                                                                  Link Attributes

                                                                  +

                                                                  (Optional) Click Add to add the JDBC connector attributes of multiple specified data sources. For details, see the JDBC connector document of the corresponding database.

                                                                  +
                                                                  The following are some examples:
                                                                  • socketTimeout: JDBC connection timeout duration, in milliseconds
                                                                  • mysql.bool.type.transform: whether to parse tinyint(1) to a Boolean value during data reading from a MySQL database. The default value is true.
                                                                  +
                                                                  +

                                                                  socketTimeout=300

                                                                  +

                                                                  Link Secret Attributes

                                                                  +

                                                                  Custom secret attributes of the link

                                                                  +

                                                                  xxx=xxx

                                                                  +
                                                                  +
                                                                  +
                                                                  +
                                                                  + +
                                                                  + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1629.html b/docs/dataartsstudio/umn/dataartsstudio_01_1629.html new file mode 100644 index 000000000..1cba47cfb --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1629.html @@ -0,0 +1,143 @@ + + +

                                                                  From YASHAN

                                                                  +

                                                                  If the source link of a job is a YASHAN link, configure the source job parameters based on Table 1.

                                                                  + +
                                                                  + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                  Table 1 Parameter description

                                                                  Type

                                                                  +

                                                                  Parameter

                                                                  +

                                                                  Description

                                                                  +

                                                                  Example Value

                                                                  +

                                                                  Basic parameters

                                                                  +

                                                                  Use SQL Statement

                                                                  +

                                                                  Whether you can use SQL statements to export data from a relational database

                                                                  +

                                                                  No

                                                                  +

                                                                  SQL Statement

                                                                  +

                                                                  When Use SQL Statement is set to Yes, enter an SQL statement here. CDM exports data based on the SQL statement.

                                                                  +
                                                                  NOTE:
                                                                  • SQL statements can only be used to query data. Join and nesting are supported, but multiple query statements are not allowed, for example, select * from table a; select * from table b.
                                                                  • With statements are not supported.
                                                                  • Comments, such as -- and /*, are not supported.
                                                                  • Addition, deletion, and modification operations are not supported, including but not limited to the following:
                                                                    • load data
                                                                    • delete from
                                                                    • alter table
                                                                    • create table
                                                                    • drop table
                                                                    • into outfile
                                                                    +
                                                                  • If the SQL statement is too long, the request fails to be delivered. If you continue to create a job, the system displays an error message indicating that the request is incorrect. In this case, you need to simplify or clear the SQL statement and try again.
                                                                  +
                                                                  +

                                                                  select id,name from sqoop.user;

                                                                  +

                                                                  Schema/Tablespace

                                                                  +

                                                                  Name of the schema or tablespace from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting a schema or directly enter a schema or tablespace.

                                                                  +

                                                                  If the desired schema or tablespace is not displayed, check whether the login account has the permissions required to query metadata.

                                                                  +
                                                                  NOTE:
                                                                  The parameter value can contain wildcard characters (*), which is used to export all databases whose names start with a certain prefix or end with a certain suffix. For example:
                                                                  • SCHEMA* indicates that all databases whose names starting with SCHEMA are exported.
                                                                  • *SCHEMA indicates that all databases whose names ending with SCHEMA are exported.
                                                                  • *SCHEMA* indicates that all databases whose names containing SCHEMA are exported.
                                                                  +
                                                                  +
                                                                  +

                                                                  SCHEMA_E

                                                                  +

                                                                  Table Name

                                                                  +

                                                                  Name of the table from which data will be extracted. This parameter is displayed when Use SQL Statement is set to No. Click the icon next to the text box to go to the page for selecting the table or directly enter a table name.

                                                                  +

                                                                  If the desired table is not displayed, check whether the table exists or whether the login account has the permission to query metadata.

                                                                  +

                                                                  This parameter can be configured as a macro variable of date and time and a path name can contain multiple macro variables. When the macro variable of date and time works with a scheduled job, the incremental data can be synchronized periodically.

                                                                  +
                                                                  NOTE:

                                                                  If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                                  +
                                                                  +
                                                                  NOTE:
                                                                  The table name can contain wildcard characters (*), which is used to export all tables whose names start with a certain prefix or end with a certain suffix. The number and types of fields in the tables must be the same. The examples are as follows:
                                                                  • table* indicates that all tables whose names starting with table are exported.
                                                                  • *table indicates that all tables whose names ending with table are exported.
                                                                  • *table* indicates that all tables whose names containing table are exported.
                                                                  +
                                                                  +
                                                                  +

                                                                  table

                                                                  +

                                                                  Advanced attributes

                                                                  +

                                                                  WHERE Clause

                                                                  +

                                                                  WHERE clause used to specify the data extraction range. This parameter is displayed when Use SQL Statement is set to No. If this parameter is not set, the entire table is extracted.

                                                                  +

                                                                  You can set a date macro variable to extract data generated on a specific date.

                                                                  +
                                                                  NOTE:

                                                                  If you have configured a macro variable of date and time and schedule a CDM job through DataArts Studio DataArts Factory, the system replaces the macro variable of date and time with (Planned start time of the data development jobOffset) rather than (Actual start time of the CDM jobOffset).

                                                                  +
                                                                  +

                                                                  DS='${dateformat(yyyy-MM-dd,-1,DAY)}'

                                                                  +

                                                                  Retain One Decimal Place for Date Values

                                                                  +

                                                                  Whether to retain one decimal place for date values

                                                                  +

                                                                  No

                                                                  +

                                                                  Partition Column

                                                                  +

                                                                  This parameter is displayed when Use SQL Statement is set to No, indicating that a field used to split data during data extraction. CDM splits a job into multiple tasks based on this field and executes the tasks concurrently. Fields with data distributed evenly are used, such as the sequential number field.

                                                                  +

                                                                  Click the icon next to the text box to go to the page for selecting a field or directly enter a field.

                                                                  +
                                                                  NOTE:

                                                                  The following types of partition columns are supported: TINYINT, SMALLINT, INTEGER, BIGINT, REAL, FLOAT, DOUBLE, NUMERIC, DECIMAL, BIT, BOOLEAN, DATE, TIME, and TIMESTAMP. The partition column should have an index.

                                                                  +
                                                                  +

                                                                  id

                                                                  +

                                                                  Null in Partition Column

                                                                  +

                                                                  Whether the partition column can contain null values

                                                                  +

                                                                  During concurrent extraction, if the partition column does not contain null, set this parameter to No to improve performance. If you are not sure whether the partition column contains null, set this parameter to Yes to avoid data loss.

                                                                  +

                                                                  No

                                                                  +

                                                                  Split Job

                                                                  +

                                                                  If this parameter is set to Yes, the job is split into multiple subjobs based on the value of Job Split Field, and the subjobs are executed concurrently.

                                                                  +
                                                                  NOTE:

                                                                  This parameter and parameters Job Split Field, Minimum Split Field Value, Maximum Split Field Value, and Number of subjobs are available only when the destination link is a DLI or Hive link.

                                                                  +
                                                                  +

                                                                  No

                                                                  +

                                                                  Job Split Field

                                                                  +

                                                                  Field used to split a job into multiple subjobs for concurrent execution. This parameter is available when Split Job is set to Yes.

                                                                  +

                                                                  -

                                                                  +

                                                                  Minimum Split Field Value

                                                                  +

                                                                  Minimum value of Job Split Field during data extraction. This parameter is available when Split Job is set to Yes.

                                                                  +

                                                                  -

                                                                  +

                                                                  Maximum Split Field Value

                                                                  +

                                                                  Maximum value of Job Split Field during data extraction. This parameter is available when Split Job is set to Yes.

                                                                  +

                                                                  -

                                                                  +

                                                                  Number of subjobs

                                                                  +

                                                                  Number of subjobs split from a job for concurrent execution based on the data range specified by the minimum and maximum values of Job Split Field. This parameter is available when Split Job is set to Yes.

                                                                  +

                                                                  -

                                                                  +
                                                                  +
                                                                  +
                                                                  + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1820.html b/docs/dataartsstudio/umn/dataartsstudio_01_1820.html index 919ab5e4e..a2fbf2a98 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1820.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1820.html @@ -1,23 +1,26 @@

                                                                  Review Center

                                                                  -

                                                                  For a workspace in simple mode, you can set the reviewer for the scripts and jobs you submit.

                                                                  -

                                                                  Constraints

                                                                  • Only the admin of the current workspace can manage reviewers, including creating and deleting reviewers. The reviewer must be the admin of the current workspace or a user with the DARTS Administrator or Tenant Administrator permission.
                                                                  • If the current workspace uses the enterprise mode, no application can be submitted for approval.
                                                                  • You can only set whether to enable the review function and review jobs and scripts on the console.
                                                                  +

                                                                  For a workspace in simple mode, you can set the reviewer for the scripts and jobs you submit. In the review center, you can manage applications and configure and maintain reviewers for workspaces.

                                                                  +

                                                                  Constraints

                                                                  • Only the administrator of the current workspace or users with the DARTS Administrator or Tenant Administrator permissions can create, modify, and delete reviewers.
                                                                  • The reviewer must be the admin of the current workspace or a user with the DARTS Administrator or Tenant Administrator permission.
                                                                  • If the current workspace is in enterprise mode, you can publish tasks for approval, but cannot submit scripts or jobs for approval.
                                                                  • If the review function is enabled, the reviewer attribute must be added to the request body of related APIs. For details, see "Job Development APIs" in DataArts Studio Usage Guide.
                                                                  • You can only set whether to enable the review function and review jobs and scripts on the console.
                                                                  • If there are real-time pipeline jobs, review cannot be enabled.
                                                                  • If the review function is enabled, the review center is visible to both reviewers and request submitters. If the review function is disabled, the review center is visible only to the administrator of the current workspace or users with the DARTS Administrator or Tenant Administrator permissions.
                                                                  • The administrator of the current workspace or users with the DARTS Administrator or Tenant Administrator permissions cannot review their own service tickets.
                                                                  -

                                                                  Approval Management

                                                                  In the Review Center, you can view the applications you have submitted and their approval progress. If you are a reviewer, you can view the applications to be reviewed and the review history, manage reviewers, and enable or disable the review function.

                                                                  -
                                                                  • Pending Review
                                                                    1. In the left navigation pane, choose Review Center. In the right pane, click the Pending Review tab.

                                                                      On this page, you can view the applications that need to be reviewed.

                                                                      -
                                                                    2. Click Review in the Operation column to view the application details and review the application.
                                                                    3. After entering the approval comments, approve or reject the application based on the actual situation.
                                                                    -
                                                                  • Reviewed
                                                                    1. In the left navigation pane, choose Review Center. In the right pane, click the Reviewed tab.
                                                                    2. Click View Details in the Operation column to view the review records and application content as an admin.
                                                                    -
                                                                  • My Applications
                                                                    1. In the left navigation pane, choose Review Center. In the right pane, click the My Applications tab.
                                                                    2. Click View Details in the Operation column to view details about an application.
                                                                    3. Click Withdraw in the Operation column to withdraw an application. You can submit the application again after modifying it.
                                                                    -
                                                                  • Review Settings
                                                                    Figure 1 Review Settings tab
                                                                    -

                                                                    -
                                                                    1. In the left navigation pane, choose Review Center. In the right pane, click the Review Configuration tab.
                                                                    2. On the Review Configuration page, you can enable or disable the review function as an admin. If the current workspace has applications that have not been reviewed, the review function cannot be disabled.
                                                                      • Submit: If you enable this function, you must specify an approver when submitting a job or script. To enable review for specified jobs/scripts, you must enable this function.
                                                                      • Specify jobs/scripts requiring review: If you enable this function, you need to specify an approver only when submitting specified jobs or scripts. If you do not enable this function, all the jobs and scripts will require review. You need to configure the jobs or scripts that require approval. The procedure is as follows:

                                                                        Click the Jobs Requiring Review tab and then Add from Baseline. On the displayed page, select the priority jobs of the baseline task as the jobs that require review. Then click OK. The upstream jobs of the baseline also need to be approved.

                                                                        -

                                                                        Click the Scripts Requiring Review tab and select the jobs corresponding to the baseline. The scripts associated with the jobs will be displayed on this page.

                                                                        -

                                                                        If Specify jobs/scripts requiring review is disabled, all jobs and scripts need to be reviewed by default.

                                                                        -
                                                                      • If there are real-time pipeline jobs, Submit cannot be enabled.
                                                                      +

                                                                      Review Settings

                                                                      Only the administrator of the current workspace or users with the DARTS Administrator or Tenant Administrator permissions can set review options. When the review function is enabled, you can configure review options for jobs or scripts.

                                                                      +
                                                                      Figure 1 Review Settings tab
                                                                      +
                                                                      1. In the left navigation pane, choose Review Center. In the right pane, click the Review Configuration tab.
                                                                      2. Enable Review. Only the administrator of the current workspace or users with the DARTS Administrator or Tenant Administrator permissions can enable or disable the review function.
                                                                        • If you enable this function, you must specify a reviewer when submitting a job or script. If you disable this function, no jobs or scripts will need reviewing.
                                                                        • If the current workspace has applications that have not been reviewed, the review function cannot be disabled.
                                                                        -
                                                                      3. Under Reviewers, you can view information about the reviewers in the current workspace as an admin.
                                                                        1. Click Manage Reviewer.
                                                                        2. Locate the current workspace and click Edit in the Operation column.
                                                                        3. Next to Workspace Members, click Add.
                                                                        4. Search for and select a member account and select the admin role for it.
                                                                        5. Click OK.
                                                                        +
                                                                      4. You can set Review Configuration to any of the following:
                                                                        • All jobs/scripts: Review is enabled for all the jobs and scripts in the workspace.
                                                                        • Custom jobs/scripts: You need to add the jobs or scripts that need to be reviewed.

                                                                          Click the Jobs tab and click Add. On the displayed page, select the jobs for which you want to enable review. When a job is added, its associated scripts are automatically added. If you select a directory, only existing jobs in the directory are added. If you want to enable review for newly created jobs in the directory, you need to add them. Click OK.

                                                                          +

                                                                          You can delete the jobs that you have added.

                                                                          +

                                                                          Click the Scripts tab and click Add. In the displayed dialog box, select the scripts for which you want to enable review. If you select a directory, only existing scripts in the directory are added. If you want to enable review for newly created scripts in the directory, you need to add them. Click OK.

                                                                          +

                                                                          You can delete scripts that you have added.

                                                                          +
                                                                        • Baseline task jobs: Add jobs to be reviewed from baseline tasks.

                                                                          Click the Jobs tab and then Add. On the displayed page, select the priority jobs of the baseline task as the jobs that require review. Then click OK. The upstream jobs of the baseline task also need to be reviewed.

                                                                          +

                                                                          Click the Scripts tab and select the jobs corresponding to the baseline. The scripts associated with the jobs will be displayed on this page.

                                                                          +
                                                                        +
                                                                      5. In the Review Information area, you can configure the reviewer information on condition that you are the administrator of the current workspace or have the DARTS Administrator or Tenant Administrator permissions.
                                                                        1. Click Manage Reviewer.
                                                                        2. Locate the current workspace and click Edit in the Operation column.
                                                                        3. Next to Workspace Members, click Add.
                                                                        4. Search for and select a member account and select the admin role for it.
                                                                        5. Click OK. The configured reviewer information is automatically displayed.
                                                                      +
                                                                      +

                                                                      Review Management

                                                                      • If you have submitted a review application, you can view the review progress on the Review Center page.
                                                                        1. In the left navigation pane, choose Review Center. In the right pane, click the My Applications tab.
                                                                        2. Click View Details in the Operation column to view details about an application.
                                                                        3. Click Withdraw in the Operation column to withdraw an application. You can submit the application again after modifying it.
                                                                        +
                                                                      • You can view the applications pending your review.
                                                                        1. In the left navigation pane, choose Review Center. In the right pane, click the Pending Review tab. On this page, you can view the applications that need to be reviewed.
                                                                        2. Click Review in the Operation column to view the application details and review the application.
                                                                        3. Enter comments and approve or reject the application.
                                                                        +
                                                                      • You can view the applications that you have reviewed.
                                                                        1. In the left navigation pane, choose Review Center. In the right pane, click the Reviewed tab. On this page, you can view the applications that you have reviewed.
                                                                        2. Click View Details in the Operation column to view the review history and content of an application.
                                                                      @@ -27,3 +30,10 @@
                                                                  + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1821.html b/docs/dataartsstudio/umn/dataartsstudio_01_1821.html index a525233be..01c8c1b6d 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1821.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1821.html @@ -7,7 +7,7 @@

                                                                  Download Center

                                                                  • The download records age out on a regular basis. When aged out, download records and the data dumped to OBS are deleted.
                                                                  • Operators can view only their own download records. Workspace admins can view all download records in the current workspace.

                                                                  On the Download Center page, you can centrally manage the execution results of SQL scripts. You can view and delete the download results, and view, download, and delete the dump results.

                                                                  -
                                                                  Figure 1 Download Center
                                                                  +
                                                                  Figure 1 Download Center

                                                                  • Set the default OBS path.

                                                                    The workspace admin can set the default OBS path for dump for the current workspace.

                                                                    @@ -15,7 +15,7 @@
                                                                5. Click OK.
                                                              3. View the script execution result.
                                                                1. In the left navigation pane on the DataArts Factory console, choose Download Center.
                                                                2. View the file name, operator, operation time, operation type, task status, and OBS path of local download tasks and asynchronous dump tasks.

                                                                  You can view the dump task download failure records.

                                                                  -
                                                                3. Click in the Operation column to download data from the OBS path.
                                                                4. Click in the Operation column to delete download and dump records.

                                                                  When you click Delete, a message is displayed indicating that the record cannot be downloaded after being deleted. Click OK.

                                                                  +
                                                                5. Click in the Operation column to download data from the OBS path.
                                                                6. Click in the Operation column to delete download and dump records.

                                                                  When you click Delete, a message is displayed indicating that the record cannot be downloaded after being deleted. Click OK.

                                                              4. Filter records by search criteria.

                                                                You can filter records by operation time, job name, OBS path, operator, operation type, and task status. You can enter a keyword for fuzzy search.

                                                              5. @@ -27,3 +27,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1822.html b/docs/dataartsstudio/umn/dataartsstudio_01_1822.html index 9a48bd6c3..521d72203 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1822.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1822.html @@ -2,7 +2,7 @@

                                                                Operation History

                                                                You can view historical operations on the Operation History page. The system stores data for a maximum of three months and automatically deletes older data.

                                                                -
                                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                3. In the left navigation pane of the DataArts Factory console, choose Monitoring > Operation History.
                                                                4. You can perform the following operations on this page:
                                                                  • Filter out historical operations in a specified time period.
                                                                  • Filter out historical operations related to job names or node names by involved object.
                                                                  • Perform a fuzzy search of historical operations.
                                                                  • Filter out historical operations by operation object, operation type, operators, or status.
                                                                  +
                                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                  3. In the left navigation pane of the DataArts Factory console, choose Monitoring > Operation History.
                                                                  4. You can perform the following operations on this page:
                                                                    • Filter out historical operations in a specified time period.
                                                                    • Filter out historical operations related to job names or node names by involved object.
                                                                    • Perform a fuzzy search of historical operations.
                                                                    • Filter out historical operations by operation object, operation type, operators, or status.
                                                                diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1823.html b/docs/dataartsstudio/umn/dataartsstudio_01_1823.html index 1e4033823..9659db356 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1823.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1823.html @@ -1,95 +1,103 @@ -

                                                                Developing a Real-Time Processing Single-Task Flink SQL Job

                                                                +

                                                                Developing a Real-Time Processing Single-Task MRS Flink SQL Job

                                                                This section describes how to develop and configure a job.

                                                                For details about how to develop a real-time processing Flink SQL job in single-task mode, see sections Developing an SQL Script, Configuring Job Parameters, Saving a Job, and Templates.

                                                                Prerequisites

                                                                • You have created a job by referring to Creating a Job.
                                                                • You have locked the job. Otherwise, you must click Lock so that you can develop the job. A job you create or import is locked by you by default. For details, see the lock function.
                                                                -

                                                                Developing an SQL Script

                                                                1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                4. In the job directory, double-click the name of a single-task job to access the job development page.
                                                                5. On the right of the SQL editor, click Basic Info to configure basic information, properties, and advanced settings of the job. Table 1 lists the basic information, Table 2 lists the properties, and Table 3 lists the advanced settings. -
                                                                  Table 1 Basic job information

                                                                  Parameter

                                                                  +

                                                                  Developing an SQL Script

                                                                  1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                  2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                  3. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                  4. In the job directory, double-click the name of a single-task job to access the job development page.
                                                                  5. On the right of the SQL editor, click Basic Info to configure basic information of the job. Table 1 provides the basic information about the single-task MRS Flink SQL job. +
                                                                    - - - - - - - - - - - - - - - - - + + +
                                                                    Table 1 Basic job information

                                                                    Parameter

                                                                    Description

                                                                    +

                                                                    Description

                                                                    Owner

                                                                    +

                                                                    Owner

                                                                    An owner configured during job creation is automatically matched. This parameter value can be modified.

                                                                    +

                                                                    An owner configured during job creation is automatically matched. This parameter value can be modified.

                                                                    Executor

                                                                    +

                                                                    Executor

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    +

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    User that executes the job. When you enter an executor, the job is executed by the executor. If the executor is left unspecified, the job is executed by the user who submitted the job for startup.

                                                                    +
                                                                    NOTE:

                                                                    You can configure execution users only after you apply for the whitelist membership. To enable it, contact customer service or technical support.

                                                                    +

                                                                    Job Agency

                                                                    +

                                                                    Job Agency

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    +

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    After an agency is configured, the job interacts with other services as an agency during job execution.

                                                                    Priority

                                                                    +

                                                                    Priority

                                                                    Priority configured during job creation is automatically matched. This parameter value can be modified.

                                                                    +

                                                                    Priority configured during job creation is automatically matched. This parameter value can be modified.

                                                                    Execution Timeout

                                                                    +

                                                                    Execution Timeout

                                                                    Timeout of the job instance. If this parameter is set to 0 or is not set, this parameter does not take effect. If the notification function is enabled for the job and the execution time of the job instance exceeds the preset value, the system sends a specified notification, and the job keeps running.

                                                                    +

                                                                    Timeout of the job instance. If this parameter is set to 0 or is not set, this parameter does not take effect. If the notification function is enabled for the job and the execution time of the job instance exceeds the preset value, the system sends a specified notification, and the job keeps running.

                                                                    Exclude Waiting Time from Instance Timeout Duration

                                                                    +

                                                                    Exclude Waiting Time from Instance Timeout Duration

                                                                    Whether to exclude the wait time from the instance execution timeout duration

                                                                    -

                                                                    If you select this option, the time to wait before an instance starts running is excluded from the timeout duration. You can modify this setting on the Default Configuration page.

                                                                    +

                                                                    Whether to exclude the wait time from the instance execution timeout duration

                                                                    +

                                                                    If you select this option, the time to wait before an instance starts running is excluded from the timeout duration. You can modify this setting in Default Configuration > Exclude Waiting Time from Instance Timeout Duration.

                                                                    If you do not select this option, the time to wait before an instance starts running is included in the timeout duration.

                                                                    Custom Parameter

                                                                    +

                                                                    Custom Parameter

                                                                    Set the name and value of the parameter.

                                                                    +

                                                                    Set the name and value of the parameter.

                                                                    Job Tag

                                                                    +

                                                                    Job Tag

                                                                    Configure job tags to manage jobs by category.

                                                                    +

                                                                    Configure job tags to manage jobs by category.

                                                                    Click Add to add a tag to the job. You can also select a tag configured in Managing Job Tags.

                                                                    Job Description

                                                                    +

                                                                    Description of the job

                                                                    +
                                                                    -
                                                                    Table 2 Properties of a single-task job

                                                                    Property

                                                                    +
                                                                    - - - - - - - - - - - - - - - - - -
                                                                    Table 2 Attributes of the real-time processing single-task MRS Flink SQL job

                                                                    Property

                                                                    Description

                                                                    +

                                                                    Description

                                                                    Flink SQL properties

                                                                    +

                                                                    Flink SQL properties

                                                                    Flink Job Name

                                                                    +

                                                                    Flink Job Name

                                                                    Enter the Flink job name.

                                                                    +

                                                                    Enter the Flink job name.

                                                                    The name is automatically generated in Workspace-Job name format.

                                                                    -
                                                                    NOTE:

                                                                    It can contain only letters, digits, hyphens (-), and underscores. A maximum of 64 characters are allowed.

                                                                    +
                                                                    NOTE:

                                                                    It can contain only letters, digits, hyphens (-), and underscores. A maximum of 64 characters are allowed, and Chinese characters are not allowed.

                                                                    MRS Cluster

                                                                    +

                                                                    MRS Cluster

                                                                    Select an MRS cluster.

                                                                    +

                                                                    Select an MRS cluster.

                                                                    NOTE:

                                                                    Currently, jobs with a single Flink SQL node support MRS 3.2.0-LTS.1 and later versions.

                                                                    Program Parameter

                                                                    +

                                                                    Program Parameter

                                                                    Set the job running parameters.

                                                                    +

                                                                    Set the job running parameters. This parameter is displayed only after an MRS cluster is selected.

                                                                    (Optional) Configure optimization parameters such as threads, memory, and vCPUs for the job to optimize resource usage and improve job execution performance.

                                                                    -
                                                                    CAUTION:

                                                                    You can query historical checkpoints and select a specified checkpoint to start a real-time Flink SQL job. To make a Flink checkpoint take effect, configure the following two parameters:

                                                                    +
                                                                    CAUTION:
                                                                    You can query historical checkpoints and select a specified checkpoint to start a real-time Flink SQL job. To make a Flink checkpoint take effect, configure the following two parameters:
                                                                    Figure 1 Configuring program parameters
                                                                    +
                                                                    • Checkpoint interval:

                                                                      -yD: execution.checkpointing.interval=1000

                                                                    • Number of reserved checkpoints:

                                                                      -yD: state.checkpoints.num-retained=10

                                                                      When querying the checkpoint list, enter parameter -s and click the parameter value text box. The parameter value will be automatically displayed.

                                                                      @@ -98,70 +106,71 @@
                                                                      NOTE:

                                                                      This parameter is mandatory if the cluster version is MRS 1.8.7 or later than MRS 2.0.1.

                                                                      Click Select Template and select a parameter template. You can also select multiple templates. For details about how to create templates, see Configuring a Template.

                                                                      -

                                                                      For details about the parameters of MRS Flink jobs, see Managing an Existing Cluster > Job Management > Running a Flink Job in MapReduce Service (MRS) User Guide.

                                                                      +

                                                                      For details about the parameters of MRS Flink jobs, see Managing an Existing Cluster > Job Management > Running a Flink Job in MapReduce Service (MRS) User Guide.

                                                                    Flink Job Parameter

                                                                    +

                                                                    Flink Job Parameter

                                                                    Set the parameters for the Flink job.

                                                                    +

                                                                    Set the parameters for the Flink job.

                                                                    Variables required for executing the Flink job. These variables are specified by the functions in the Hive script. Multiple parameters are separated by spaces.

                                                                    MRS Resource Queue

                                                                    +

                                                                    MRS Resource Queue

                                                                    Select a created MRS resource queue.

                                                                    +

                                                                    Select a created MRS resource queue.

                                                                    +

                                                                    This parameter is mandatory if Whether MRS Resource Queue Is Mandatory is set to Yes.

                                                                    Select a queue you configured in the queue permissions of DataArts Security. If you set multiple resource queues for this node, the resource queue you select here has the highest priority.

                                                                    Rerun Policy

                                                                    +

                                                                    Rerun Policy

                                                                    • Rerun from the previous checkpoint
                                                                    • Rerun the job
                                                                    +
                                                                    • Rerun from the previous checkpoint
                                                                    • Rerun the job

                                                                    Input Data Path

                                                                    +

                                                                    Input Data Path

                                                                    Set the input data path. You can select an HDFS or OBS path.

                                                                    +

                                                                    Set the input data path. You can select an HDFS or OBS path.

                                                                    Output Data Path

                                                                    +

                                                                    Output Data Path

                                                                    Set the output data path. You can select an HDFS or OBS path.

                                                                    +

                                                                    Set the output data path. You can select an HDFS or OBS path.

                                                                    -
                                                                    Table 3 Advanced Settings

                                                                    Parameter

                                                                    +
                                                                    - - - - - - - - - - -
                                                                    Table 3 Advanced Settings

                                                                    Parameter

                                                                    Mandatory

                                                                    +

                                                                    Mandatory

                                                                    Description

                                                                    +

                                                                    Description

                                                                    Job Status Polling Interval (s)

                                                                    +

                                                                    Job Status Polling Interval (s)

                                                                    Yes

                                                                    +

                                                                    Yes

                                                                    Set the interval at which the system checks whether the job is complete. The interval can range from 30s to 60s, or 120s, 180s, 240s, or 300s.

                                                                    +

                                                                    Set the interval at which the system checks whether the job is complete. The interval can range from 30s to 60s, or 120s, 180s, 240s, or 300s.

                                                                    During job execution, the system checks the job status at the configured interval.

                                                                    Maximum Wait Time

                                                                    +

                                                                    Maximum Wait Time

                                                                    Yes

                                                                    +

                                                                    Yes

                                                                    Set the timeout interval for the job. If the job is not complete within the timeout interval and retry is enabled, the job will be executed again.

                                                                    +

                                                                    Set the timeout interval for the job. If the job is not complete within the timeout interval and retry is enabled, the job will be executed again.

                                                                    NOTE:

                                                                    If the job is in starting state and fails to start, it will fail upon timeout.

                                                                    Retry upon Failure

                                                                    +

                                                                    Retry upon Failure

                                                                    Yes

                                                                    +

                                                                    Yes

                                                                    Whether to re-execute the job if it fails

                                                                    +

                                                                    Whether to re-execute the job if it fails

                                                                    • Yes: The job will be re-executed if it fails. Configure the following parameters:
                                                                      • Retry upon Timeout
                                                                      • Maximum Retries
                                                                      • Retry Interval (seconds)
                                                                    • No: The job will not be re-executed if it fails. This is the default setting.
                                                                      NOTE:

                                                                      If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                                      If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                                      @@ -175,88 +184,87 @@
                                                                    • Enter one or more SQL statements in the SQL editor.
                                                                      • SQL statements are separated by semicolons (;). If semicolons are used in other places but not used to separate SQL statements, escape them with backslashes (\). The following is an example:
                                                                        select 1;
                                                                         select * from a where b="dsfa\;";  --example 1\;example 2.
                                                                        -
                                                                      • The script cannot be larger than 16 MB.
                                                                      • The system date obtained by using an SQL statement is different from that obtained by using the database tool. The query result is stored in the database in the YYYY-MM-DD format, but the query result displayed on the page is in the converted format.
                                                                      +
                                                                    • The script cannot be larger than 16 MB.
                                                                    • The system date obtained by using an SQL statement is different from that obtained by using the database tool. The query result is stored in the database in the YYYY-MM-DD format, but the query result displayed on the page is in the converted format.
                                                                    • You can click Check Syntax to check the syntax of Flink SQL jobs. Above the editor, click Check Syntax to verify the semantics of SQL statements. After the check is complete, you can view the check result in the lower part of the page.
                                                                    • When viewing the script execution result, you can double-click a field in any row to view the result details. You can copy the field name.
                                                                    • You can control display of the script execution history by setting Script Execution History in Default Configuration to Myself or All users.
                                                                    -
                                                                    To facilitate script development, DataArts Factory provides the following capabilities:
                                                                    • The script editor supports the following shortcut keys, which improve the script development efficiency:
                                                                      • F8: Run a script.
                                                                      • F9: Stop running a script.
                                                                      • Ctrl + /: Comment out or uncomment the line or code block where the cursor resides.
                                                                      • Ctrl + Z: Undo an action.
                                                                      • Ctrl + F: Search for information.
                                                                      • Ctrl + Shift + R: Replace
                                                                      • Ctrl + X: Cut
                                                                      • Ctrl + S: Save a script.
                                                                      • Alt + mouse dragging: Select columns to edit a block.
                                                                      • Ctrl + mouse click: Select multiple lines to edit or indent them together.
                                                                      • Shift + Ctrl + K: Delete the current line.
                                                                      • Ctrl + (or ): Move the cursor rightwards (or leftwards) by word.
                                                                      • Ctrl + Home or Ctrl + End: Navigate to the beginning or end of the current file.
                                                                      • Home or End: Navigate to the beginning or end of the current line.
                                                                      • Ctrl + Shift + L: Double-click all the same character strings and add cursors to them to implement batch modification.
                                                                      • Ctrl + D: Delete a line.
                                                                      • Shift + Ctrl + U: Unlock a script.
                                                                      • Ctrl + Alt + K: Select the word where the cursor resides.
                                                                      • Ctrl + B: Format
                                                                      • Ctrl + Shift + Z: Redo
                                                                      • Ctrl + Enter: Execute the selected line or content.
                                                                      • Ctrl + Alt + F: Flag
                                                                      • Ctrl + Shift + K: Search for the previous one.
                                                                      • Ctrl + K: Search for the next one.
                                                                      • Ctrl + Backspace: Delete the word to the left of the cursor.
                                                                      • Ctrl + Delete: Delete the word to the right of the cursor.
                                                                      • Alt + Backspace: Delete all content from the beginning of the line to the cursor.
                                                                      • Alt + Delete: Delete all content from the cursor to the end of the line.
                                                                      • Alt + Shift-Left: Select all content from the beginning of the line to the cursor.
                                                                      • Alt + Shift-Right: Select all content from the cursor to the end of the line.
                                                                      +
                                                                      To facilitate script development, DataArts Factory provides the following capabilities:
                                                                      • The script editor supports the following shortcut keys, which improve the script development efficiency:
                                                                        • F8: Run a script.
                                                                        • F9: Stop running a script.
                                                                        • Ctrl + /: Comment out or uncomment the line or code block where the cursor resides.
                                                                        • Ctrl + Z: Undo an action.
                                                                        • Ctrl + F: Search for information.
                                                                        • Ctrl + Shift + R: Replace
                                                                        • Ctrl + X: Cut
                                                                        • Ctrl + S: Save a script.
                                                                        • Alt + mouse dragging: Select columns to edit a block.
                                                                        • Ctrl + mouse click: Select multiple lines to edit or indent them together.
                                                                        • Ctrl + (or ): Move the cursor rightwards (or leftwards) by word.
                                                                        • Ctrl + Home or Ctrl + End: Navigate to the beginning or end of the current file.
                                                                        • Home or End: Navigate to the beginning or end of the current line.
                                                                        • Ctrl + Shift + L: Double-click all the same character strings and add cursors to them to implement batch modification.
                                                                        • Ctrl + D: Delete a line.
                                                                        • Shift + Ctrl + U: Unlock a script.
                                                                        • Ctrl + Alt + K: Select the word where the cursor resides.
                                                                        • Ctrl + B: Format
                                                                        • Ctrl + Shift + Z: Redo
                                                                        • Ctrl + Enter: Execute the selected line or content.
                                                                        • Ctrl + Alt + F: Flag
                                                                        • Ctrl + Shift + K: Search for the previous one.
                                                                        • Ctrl + K: Search for the next one.
                                                                        • Ctrl + Backspace: Delete the word to the left of the cursor.
                                                                        • Ctrl + Delete: Delete the word to the right of the cursor.
                                                                        • Alt + Backspace: Delete all content from the beginning of the line to the cursor.
                                                                        • Alt + Delete: Delete all content from the cursor to the end of the line.
                                                                        • Alt + Shift-Left: Select all content from the beginning of the line to the cursor.
                                                                        • Alt + Shift-Right: Select all content from the cursor to the end of the line.
                                                                      • Script parameters

                                                                        Enter script parameters in the SQL statement and click Parameter Setup in the right pane of the editor and then click Update from Script. You can also directly configure parameters and constants for the job script.

                                                                        In the following script example, str1 indicates the parameter name. It can contain only letters, digits, hyphens (-), underscores (_), greater-than signs (>), and less-than signs (<), and can contain a maximum of 16 characters. The parameter name must be unique.

                                                                        select ${str1} from data;
                                                                      -
                                                                    • (Optional) In the upper part of the editor, click Format to format SQL statements.
                                                                    • Above the editor, click to save the job and submit it.
                                                                    • +
                                                                    • (Optional) In the upper part of the editor, click Format to format SQL statements.
                                                                    • Above the editor, click Save to save the job and submit it.
                                                                    -

                                                                    Configuring Job Parameters

                                                                    Job parameters can be globally used in any node in jobs. The procedure is as follows:

                                                                    -

                                                                    Click Parameters on the right of the editor and set the parameters described in Table 4.

                                                                    +

                                                                    Configuring Job Parameters

                                                                    Click Parameters on the right of the editor and set the parameters described in Table 4.

                                                                    -
                                                                    Table 4 Job parameters

                                                                    Function

                                                                    +
                                                                    - - - - - - - - - - - - - - - - - - - - - - - @@ -264,40 +272,40 @@ select * from a where b="dsfa\;"; --example 1\;example 2.

                                                                    Click the Parameter Preview tab and configure the parameters listed in Table 5.

                                                                    -
                                                                    Table 4 Job parameters

                                                                    Function

                                                                    Description

                                                                    +

                                                                    Description

                                                                    Variables

                                                                    +

                                                                    Variables

                                                                    Add

                                                                    +

                                                                    Add

                                                                    Click Add and enter the variable parameter name and parameter value in the text boxes.

                                                                    -
                                                                    • Parameter name

                                                                      Only letters, digits, hyphens (-), and underscores (_) are allowed.

                                                                      +

                                                                    Click Add and enter the variable parameter name and parameter value in the text boxes.

                                                                    +
                                                                    • Parameter name

                                                                      Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                                    • Parameter value
                                                                      • The string type of parameter value is a character string, for example, str1.
                                                                      • The numeric type of parameter value is a number or operation expression.

                                                                    After the parameter is configured, it is referenced in the format of ${parameter name} in the job.

                                                                    Edit Parameter Expression

                                                                    +

                                                                    Edit Parameter Expression

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    +

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    Modify

                                                                    +

                                                                    Modify

                                                                    Change the parameter name or value in the corresponding text boxes.

                                                                    +

                                                                    Change the parameter name or value in the corresponding text boxes.

                                                                    Mask

                                                                    +

                                                                    Mask

                                                                    If the parameter value is a key, click to mask the value for security purposes.

                                                                    +

                                                                    If the parameter value is a key, click to mask the value for security purposes.

                                                                    Delete

                                                                    +

                                                                    Delete

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    +

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    Constant Parameter

                                                                    +

                                                                    Constant Parameter

                                                                    Add

                                                                    +

                                                                    Add

                                                                    Click Add and enter the constant parameter name and parameter value in the text boxes.

                                                                    -
                                                                    • Parameter name

                                                                      Only letters, digits, hyphens (-), and underscores (_) are allowed.

                                                                      +

                                                                    Click Add and enter the constant parameter name and parameter value in the text boxes.

                                                                    +
                                                                    • Parameter name

                                                                      Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                                    • Parameter value
                                                                      • The string type of parameter value is a character string, for example, str1.
                                                                      • The numeric type of parameter value is a number or operation expression.

                                                                    After the parameter is configured, it is referenced in the format of ${parameter name} in the job.

                                                                    Edit Parameter Expression

                                                                    +

                                                                    Edit Parameter Expression

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    +

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    Modify

                                                                    +

                                                                    Modify

                                                                    Modify the parameter name and parameter value in text boxes and save the modifications.

                                                                    +

                                                                    Modify the parameter name and parameter value in text boxes and save the modifications.

                                                                    Delete

                                                                    +

                                                                    Delete

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    +

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    Workspace Environment Variables

                                                                    +

                                                                    Workspace Environment Variables

                                                                    View the variables and constants that have been configured in the workspace.

                                                                    +

                                                                    View the variables and constants that have been configured in the workspace.

                                                                    Table 5 Job parameter preview

                                                                    Function

                                                                    +
                                                                    - - - - - - - - - - - - - @@ -310,10 +318,12 @@ select * from a where b="dsfa\;"; --example 1\;example 2.

                                                                    Saving a Job

                                                                    After configuring the job, perform the following operations:

                                                                    -
                                                                    1. Click to execute the job.
                                                                    2. After the job is executed, click to save the job configuration.

                                                                      After the job is saved, a version is automatically generated and displayed in Versions. The version can be rolled back. If you save a job multiple times within a minute, only one version is recorded. If the intermediate data is important, you can click Save new version to save and add a version.

                                                                      +
                                                                      1. Click Start to execute the job. When viewing the script execution result, you can double-click a field in any row to view the result details. You can copy the field name.

                                                                        A maximum of 1,000 records can be displayed in the execution result. The size of the execution result cannot exceed 3 MB. If the size exceeds 3 MB, the result will be truncated.

                                                                        +
                                                                        +

                                                                      2. After the job is executed, click to save the job configuration.

                                                                        After the job is saved, a version is automatically generated and displayed in Versions. The version can be rolled back. If you save a job multiple times within a minute, only one version is recorded. If the intermediate data is important, you can click Save new version to save and add a version.

                                                                    -

                                                                    Templates

                                                                    When developing a real-time processing, single-task Flink SQL job, you can reference a script template. For details about how to create a template, see Configuring a Template. For details about how to use a script template, see Using Script Templates and Parameter Templates.

                                                                    +

                                                                    Templates

                                                                    When developing a real-time processing, single-task Flink SQL job, you can use a public script template. For details about how to create a template, see Configuring a Template. For details about how to use a script template, see Using Script Templates and Parameter Templates.

                                                                    @@ -322,3 +332,10 @@ select * from a where b="dsfa\;"; --example 1\;example 2.
                                                                    + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1824.html b/docs/dataartsstudio/umn/dataartsstudio_01_1824.html index 884a68e65..194918ea6 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1824.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1824.html @@ -1,10 +1,10 @@ -

                                                                    Developing a Real-Time Processing Single-Task Flink Jar Job

                                                                    +

                                                                    Developing a Real-Time Processing Single-Task MRS Flink Jar Job

                                                                    Prerequisites

                                                                    A single-task real-time processing Flink Jar job has been created. For details, see Creating a Job.

                                                                    -

                                                                    Configuring the Flink Jar Job

                                                                    -
                                                                    Table 5 Job parameter preview

                                                                    Function

                                                                    Description

                                                                    +

                                                                    Description

                                                                    Current Time

                                                                    +

                                                                    Current Time

                                                                    This parameter is displayed only when Scheduling Type is set to Run once. The default value is the current time.

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run once. The default value is the current time.

                                                                    Event Triggering Time

                                                                    +

                                                                    Event Triggering Time

                                                                    This parameter is displayed only when Scheduling Type is set to Event-based. The default value is the time when an event is triggered.

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Event-based. The default value is the time when an event is triggered.

                                                                    Scheduling Period

                                                                    +

                                                                    Scheduling Period

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The default value is the scheduling period.

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The default value is the scheduling period.

                                                                    Start Time

                                                                    +

                                                                    Start Time

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the configured job execution time.

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the configured job execution time.

                                                                    Start Time

                                                                    +

                                                                    Start Time

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the time when the periodic job scheduling starts.

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the time when the periodic job scheduling starts.

                                                                    Subsequent Instances

                                                                    +

                                                                    Subsequent Instances

                                                                    Number of job instances scheduled.

                                                                    +

                                                                    Number of job instances scheduled.

                                                                    • The default value is 1 when Scheduling Type is set to Run once.
                                                                    • The default value is 1 when Scheduling Type is set to Event-based.
                                                                    • When Scheduling Type is set to Run periodically:

                                                                      If the number of instances exceeds 10, a maximum of 10 instances can be displayed, and the system displays message "A maximum of 10 instances are supported."

                                                                    -
                                                                    Table 1 Properties

                                                                    Parameter

                                                                    +

                                                                    Configuring the MRS Flink Jar Job

                                                                    +
                                                                    @@ -18,7 +18,7 @@ - @@ -137,6 +138,194 @@
                                                                    Table 1 MRS Flink Jar job parameters

                                                                    Parameter

                                                                    Mandatory

                                                                    Enter the Flink job name.

                                                                    The name is automatically generated in Workspace-Job name format.

                                                                    -

                                                                    The job name can contain 1 to 64 characters. Only letters, digits, hyphens (-), and underscores (_) are allowed.

                                                                    +

                                                                    The job name can contain 1 to 64 characters. Only letters, digits, hyphens (-), and underscores (_) are allowed. Chinese characters are not allowed.

                                                                    MRS Cluster

                                                                    @@ -34,7 +34,7 @@

                                                                    No

                                                                    Set job running parameters.

                                                                    +

                                                                    Set job running parameters. This parameter is displayed only after an MRS cluster is selected.

                                                                    (Optional) Configure optimization parameters such as threads, memory, and vCPUs for the job to optimize resource usage and improve job execution performance.

                                                                    CAUTION:

                                                                    You can query historical checkpoints and select a specified checkpoint to start a Flink JAR job. To make a Flink checkpoint take effect, configure the following two parameters:

                                                                    • Checkpoint interval:

                                                                      -yD: execution.checkpointing.interval=1000

                                                                      @@ -45,7 +45,7 @@
                                                                      NOTE:

                                                                      This parameter is mandatory if the cluster version is MRS 1.8.7 or later than MRS 2.0.1.

                                                                      Click Select Template and select a parameter template. You can also select multiple templates. For details on how to create data connections, see Configuring a Template.

                                                                      -

                                                                      For details about the parameters of MRS Flink jobs, see Managing an Existing Cluster > Job Management > Running a Flink Job in MapReduce Service (MRS) User Guide.

                                                                      +

                                                                      For details about the parameters of MRS Flink jobs, see Managing an Existing Cluster > Job Management > Running a Flink Job in MapReduce Service (MRS) User Guide.

                                                                    Job Execution Parameter

                                                                    @@ -61,6 +61,7 @@

                                                                    No

                                                                    Select a created MRS resource queue.

                                                                    +

                                                                    This parameter is mandatory if Whether MRS Resource Queue Is Mandatory is set to Yes.

                                                                    Select a queue you configured in the queue permissions of DataArts Security. If you set multiple resource queues for this node, the resource queue you select here has the highest priority.

                                                                    +

                                                                    After setting the parameters, click Save and submit the job.

                                                                    +

                                                                    Click Start to run the job.

                                                                    +
                                                                    +

                                                                    Configuring Basic Job Information

                                                                    +
                                                                    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                    Table 3 Basic job information

                                                                    Parameter

                                                                    +

                                                                    Description

                                                                    +

                                                                    Owner

                                                                    +

                                                                    An owner configured during job creation is automatically matched. This parameter value can be modified.

                                                                    +

                                                                    Executor

                                                                    +

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    +

                                                                    User that executes the job. When you enter an executor, the job is executed by the executor. If the executor is left unspecified, the job is executed by the user who submitted the job for startup.

                                                                    +
                                                                    NOTE:

                                                                    You can configure execution users only after you apply for the whitelist membership. To enable it, contact customer service or technical support.

                                                                    +
                                                                    +

                                                                    Job Agency

                                                                    +

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    +

                                                                    After an agency is configured, the job interacts with other services as an agency during job execution.

                                                                    +

                                                                    Priority

                                                                    +

                                                                    Priority configured during job creation is automatically matched. This parameter value can be modified.

                                                                    +

                                                                    Execution Timeout

                                                                    +

                                                                    Timeout of the job instance. If this parameter is set to 0 or is not set, this parameter does not take effect. If the notification function is enabled for the job and the execution time of the job instance exceeds the preset value, the system sends a specified notification, and the job keeps running.

                                                                    +

                                                                    Exclude Waiting Time from Instance Timeout Duration

                                                                    +

                                                                    Whether to exclude the wait time from the instance execution timeout duration

                                                                    +

                                                                    If you select this option, the time to wait before an instance starts running is excluded from the timeout duration. You can modify this setting in Default Configuration > Exclude Waiting Time from Instance Timeout Duration.

                                                                    +

                                                                    If you do not select this option, the time to wait before an instance starts running is included in the timeout duration.

                                                                    +

                                                                    Custom Parameter

                                                                    +

                                                                    Set the name and value of the parameter.

                                                                    +

                                                                    Job Tag

                                                                    +

                                                                    Configure job tags to manage jobs by category.

                                                                    +

                                                                    Click Add to add a tag to the job. You can also select a tag configured in Managing Job Tags.

                                                                    +

                                                                    Job Description

                                                                    +

                                                                    Description of the job

                                                                    +
                                                                    +
                                                                    +
                                                                    +

                                                                    Configuring Job Parameters

                                                                    Click Parameters on the right of the editor and set the parameters described in Table 4.

                                                                    + +
                                                                    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                    Table 4 Job parameters

                                                                    Function

                                                                    +

                                                                    Description

                                                                    +

                                                                    Variables

                                                                    +

                                                                    Add

                                                                    +

                                                                    Click Add and enter the variable parameter name and parameter value in the text boxes.

                                                                    +
                                                                    • Parameter name

                                                                      Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                                      +
                                                                    • Parameter value
                                                                      • The string type of parameter value is a character string, for example, str1.
                                                                      • The numeric type of parameter value is a number or operation expression.
                                                                      +
                                                                    +

                                                                    After the parameter is configured, it is referenced in the format of ${parameter name} in the job.

                                                                    +

                                                                    Edit Parameter Expression

                                                                    +

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    +

                                                                    Modify

                                                                    +

                                                                    Change the parameter name or value in the corresponding text boxes.

                                                                    +

                                                                    Mask

                                                                    +

                                                                    If the parameter value is a key, click to mask the value for security purposes.

                                                                    +

                                                                    Delete

                                                                    +

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    +

                                                                    Constant Parameter

                                                                    +

                                                                    Add

                                                                    +

                                                                    Click Add and enter the constant parameter name and parameter value in the text boxes.

                                                                    +
                                                                    • Parameter name

                                                                      Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                                      +
                                                                    • Parameter value
                                                                      • The string type of parameter value is a character string, for example, str1.
                                                                      • The numeric type of parameter value is a number or operation expression.
                                                                      +
                                                                    +

                                                                    After the parameter is configured, it is referenced in the format of ${parameter name} in the job.

                                                                    +

                                                                    Edit Parameter Expression

                                                                    +

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    +

                                                                    Modify

                                                                    +

                                                                    Modify the parameter name and parameter value in text boxes and save the modifications.

                                                                    +

                                                                    Delete

                                                                    +

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    +

                                                                    Workspace Environment Variables

                                                                    +

                                                                    View the variables and constants that have been configured in the workspace.

                                                                    +
                                                                    +
                                                                    +

                                                                    Click the Parameter Preview tab and configure the parameters listed in Table 5.

                                                                    + +
                                                                    + + + + + + + + + + + + + + + + + + + + + + +
                                                                    Table 5 Job parameter preview

                                                                    Function

                                                                    +

                                                                    Description

                                                                    +

                                                                    Current Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run once. The default value is the current time.

                                                                    +

                                                                    Event Triggering Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Event-based. The default value is the time when an event is triggered.

                                                                    +

                                                                    Scheduling Period

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The default value is the scheduling period.

                                                                    +

                                                                    Start Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the configured job execution time.

                                                                    +

                                                                    Start Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the time when the periodic job scheduling starts.

                                                                    +

                                                                    Subsequent Instances

                                                                    +

                                                                    Number of job instances scheduled.

                                                                    +
                                                                    • The default value is 1 when Scheduling Type is set to Run once.
                                                                    • The default value is 1 when Scheduling Type is set to Event-based.
                                                                    • When Scheduling Type is set to Run periodically:

                                                                      If the number of instances exceeds 10, a maximum of 10 instances can be displayed, and the system displays message "A maximum of 10 instances are supported."

                                                                      +
                                                                    +
                                                                    +
                                                                    +

                                                                    In Parameter Preview, if a job parameter has a syntax error, the system displays a message.

                                                                    +

                                                                    If a parameter depends on the data generated during job execution, such data cannot be simulated and displayed in Parameter Preview.

                                                                    +
                                                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1825.html b/docs/dataartsstudio/umn/dataartsstudio_01_1825.html index 98a33b849..447118cc2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1825.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1825.html @@ -31,7 +31,7 @@

                                                                    No

                                                                    • 2.3.2
                                                                    • 2.4.5
                                                                    • 3.1.1
                                                                    +
                                                                    • 2.3.2
                                                                    • 2.4.5
                                                                    • 3.1.1
                                                                    • 3.3.1

                                                                    Job Type

                                                                    @@ -156,6 +156,194 @@
                                                                    +

                                                                    After setting the parameters, click Save and submit the job.

                                                                    +

                                                                    Click Start to run the job.

                                                                    + +

                                                                    Configuring Basic Job Information

                                                                    +
                                                                    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                    Table 3 Basic job information

                                                                    Parameter

                                                                    +

                                                                    Description

                                                                    +

                                                                    Owner

                                                                    +

                                                                    An owner configured during job creation is automatically matched. This parameter value can be modified.

                                                                    +

                                                                    Executor

                                                                    +

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    +

                                                                    User that executes the job. When you enter an executor, the job is executed by the executor. If the executor is left unspecified, the job is executed by the user who submitted the job for startup.

                                                                    +
                                                                    NOTE:

                                                                    You can configure execution users only after you apply for the whitelist membership. To enable it, contact customer service or technical support.

                                                                    +
                                                                    +

                                                                    Job Agency

                                                                    +

                                                                    This parameter is available when Scheduling Identities is set to Yes.

                                                                    +

                                                                    After an agency is configured, the job interacts with other services as an agency during job execution.

                                                                    +

                                                                    Priority

                                                                    +

                                                                    Priority configured during job creation is automatically matched. This parameter value can be modified.

                                                                    +

                                                                    Execution Timeout

                                                                    +

                                                                    Timeout of the job instance. If this parameter is set to 0 or is not set, this parameter does not take effect. If the notification function is enabled for the job and the execution time of the job instance exceeds the preset value, the system sends a specified notification, and the job keeps running.

                                                                    +

                                                                    Exclude Waiting Time from Instance Timeout Duration

                                                                    +

                                                                    Whether to exclude the wait time from the instance execution timeout duration

                                                                    +

                                                                    If you select this option, the time to wait before an instance starts running is excluded from the timeout duration. You can modify this setting in Default Configuration > Exclude Waiting Time from Instance Timeout Duration.

                                                                    +

                                                                    If you do not select this option, the time to wait before an instance starts running is included in the timeout duration.

                                                                    +

                                                                    Custom Parameter

                                                                    +

                                                                    Set the name and value of the parameter.

                                                                    +

                                                                    Job Tag

                                                                    +

                                                                    Configure job tags to manage jobs by category.

                                                                    +

                                                                    Click Add to add a tag to the job. You can also select a tag configured in Managing Job Tags.

                                                                    +

                                                                    Job Description

                                                                    +

                                                                    Description of the job

                                                                    +
                                                                    +
                                                                    +
                                                                    +

                                                                    Configuring job parameters

                                                                    Click Parameter Setup on the right of the editor and set the parameters described in Table 4.

                                                                    + +
                                                                    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                    Table 4 Job parameter setup

                                                                    Module

                                                                    +

                                                                    Description

                                                                    +

                                                                    Variables

                                                                    +

                                                                    Add

                                                                    +

                                                                    Click Add and enter the variable parameter name and parameter value in the text boxes.

                                                                    +
                                                                    • Parameter

                                                                      Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                                      +
                                                                    • Parameter Value
                                                                      • The string type of parameter value is a character string, for example, str1.
                                                                      • The numeric type of parameter value is a number or operation expression.
                                                                      +
                                                                    +

                                                                    After the parameter is configured, it is referenced in the format of ${Parameter name} in the job.

                                                                    +

                                                                    Edit Parameter Expression

                                                                    +

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    +

                                                                    Modifying a Job

                                                                    +

                                                                    Change the parameter name or value in the corresponding text boxes.

                                                                    +

                                                                    Mask

                                                                    +

                                                                    If the parameter value is a key, click to mask the value for security purposes.

                                                                    +

                                                                    Delete

                                                                    +

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    +

                                                                    Constant Parameter

                                                                    +

                                                                    Add

                                                                    +

                                                                    Click Add and enter the constant parameter name and parameter value in the text boxes.

                                                                    +
                                                                    • Parameter

                                                                      Only letters, numbers, periods (.), hyphens (-), and underscores (_) are allowed.

                                                                      +
                                                                    • Parameter Value
                                                                      • The string type of parameter value is a character string, for example, str1.
                                                                      • The numeric type of parameter value is a number or operation expression.
                                                                      +
                                                                    +

                                                                    After the parameter is configured, it is referenced in the format of ${Parameter name} in the job.

                                                                    +

                                                                    Edit Parameter Expression

                                                                    +

                                                                    Click next to the parameter value text box. In the displayed dialog box, edit the parameter expression. For more expressions, see Expression Overview.

                                                                    +

                                                                    Modifying a Job

                                                                    +

                                                                    Modify the parameter name and parameter value in text boxes and save the modifications.

                                                                    +

                                                                    Delete

                                                                    +

                                                                    Click next to the parameter name and value text boxes to delete the job parameter.

                                                                    +

                                                                    Workspace Environment Variables

                                                                    +

                                                                    View the variables and constants that have been configured in the workspace.

                                                                    +
                                                                    +
                                                                    +

                                                                    Click the Parameter Preview tab and configure the parameters listed in Table 5.

                                                                    + +
                                                                    + + + + + + + + + + + + + + + + + + + + + + +
                                                                    Table 5 Job parameter preview

                                                                    Module

                                                                    +

                                                                    Description

                                                                    +

                                                                    Current Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run once. The default value is the current time.

                                                                    +

                                                                    Event Triggering Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Event-based. The default value is the time when an event is triggered.

                                                                    +

                                                                    Scheduling Period

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The default value is the scheduling period.

                                                                    +

                                                                    Start Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the configured job execution time.

                                                                    +

                                                                    Start Time

                                                                    +

                                                                    This parameter is displayed only when Scheduling Type is set to Run periodically. The value is the time when the periodic job scheduling starts.

                                                                    +

                                                                    Subsequent Instances

                                                                    +

                                                                    Number of job instances scheduled.

                                                                    +
                                                                    • The default value is 1 when Scheduling Type is set to Run once.
                                                                    • The default value is 1 when Scheduling Type is set to Event-based.
                                                                    • When Scheduling Type is set to Run periodically:

                                                                      If the number of instances exceeds 10, a maximum of 10 instances can be displayed, and the system displays message "A maximum of 10 instances are supported."

                                                                      +
                                                                    +
                                                                    +
                                                                    +

                                                                    In Parameter Preview, if a job parameter has a syntax error, the system displays a message.

                                                                    +

                                                                    If a parameter depends on the data generated during job execution, such data cannot be simulated and displayed in Parameter Preview.

                                                                    +
                                                                    diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1902.html b/docs/dataartsstudio/umn/dataartsstudio_01_1902.html index 04017b3f7..faa39be44 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1902.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1902.html @@ -1,23 +1,22 @@

                                                                    Releasing a Script Task

                                                                    -

                                                                    In enterprise mode, when a developer submits a script version, the system generates a script release task. After the developer confirms releasing a package and the admin, deployer, a user with the DARTS Administrator or Tenant Administrator permission approves the package release request, the modified script is synchronized to the production environment.

                                                                    +

                                                                    In enterprise mode, when a developer submits a script version, the system generates a script release task. After the developer confirms releasing a package and the admin, deployer, a user with the DARTS Administrator or Tenant Administrator permission approves the package release request, the modified script is synchronized to the production environment.

                                                                    • If the admin imported a submitted script, a release task will be generated.
                                                                    • If the admin imported a released script, no release task will be generated.

                                                                    Prerequisites

                                                                    You have submitted a version. For details, see Submitting a Version.

                                                                    -

                                                                    Procedure

                                                                    1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                    2. In the left navigation pane, choose Data Development > Task Release.
                                                                    3. On the Tasks page, the tasks generated for version submission are displayed. You can click View in the Operation column to view the modifications of a script compared with its previous version. After confirming that the modifications are correct, click Release to release the task.

                                                                      You can filter tasks by name or submitter, and perform fuzzy search using a task name.
                                                                      • If you have only the developer permission, the script will be synchronized to the production environment only when the task is approved by the admin or deployer.
                                                                      • After clicking Release, set the reviewer. The reviewer must be a workspace admin, deployer, or a user with the DARTS Administrator or Tenant Administrator permission. Set at least one reviewer and do not set yourself as the reviewer. Click Reviewer Information to go to the Workspaces page. Click Edit to configure reviewers.
                                                                      • You can release a maximum of 100 tasks at a time. The tasks are released asynchronously. You can view the task release process.
                                                                      • You can revoke tasks not to be released as a developer, deployer, or admin.
                                                                      +

                                                                      Procedure

                                                                      1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                      2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                      3. In the left navigation pane, choose Data Development > Task Release.
                                                                      4. On the Tasks page, the tasks generated for version submission are displayed. You can click View in the Operation column to view the modifications of a script compared with its previous version. After confirming that the modifications are correct, click Release to release the task.

                                                                        You can filter tasks by name or submitter, and perform fuzzy search using a task name.
                                                                        • If you have only the developer permission, the script will be synchronized to the production environment only when the task is approved by the admin or deployer.
                                                                        • After clicking Release, set the reviewer. The reviewer must be a workspace admin, deployer, or a user with the DARTS Administrator or Tenant Administrator permission. Set at least one reviewer and do not set yourself as the reviewer. Click Reviewer Information to go to the Workspaces page. Click Edit to configure reviewers.
                                                                        • You can release a maximum of 100 tasks at a time. The tasks are released asynchronously. You can view the task release process.
                                                                        • You can revoke tasks not to be released as a developer, deployer, or admin.
                                                                        -
                                                                        Figure 1 Clicking Release
                                                                        +
                                                                        Figure 1 Clicking Release
                                                                        -

                                                                        -

                                                                      5. After the task is released, you can view the release status of the task on the Packages tab page. After approved, the task is released successfully.

                                                                        You can filter packages by Applicant, Application Time, Release At, or Released By, and perform fuzzy search using a package name.
                                                                        Figure 2 Viewing the task status
                                                                        +

                                                                      6. After the task is released, you can view the release status of the task on the Packages tab page. After approved, the task is released successfully.

                                                                        You can filter packages by Applicant, Application Time, Release At, or Released By, and perform fuzzy search using a package name.
                                                                        Figure 2 Viewing the task status

                                                                        You can revoke tasks not to be released as a developer, deployer, or admin.

                                                                        After the task is released, you can click View Details in the Operation column to view the release status and startup status of the task. You can also click Compare Version in the Operation column to view the differences between different versions of release packages.

                                                                        -
                                                                        Figure 3 Viewing release package details
                                                                        +
                                                                        Figure 3 Viewing release package details

                                                                      @@ -28,3 +27,10 @@
                                                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_1903.html b/docs/dataartsstudio/umn/dataartsstudio_01_1903.html index 4637d2537..bcd8fc47c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_1903.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_1903.html @@ -1,23 +1,22 @@

                                                                      Releasing a Job Task

                                                                      -

                                                                      In enterprise mode, when a developer submits a job version, the system generates a job release task. After the developer confirms the release task and the admin, deployer, a user with the DARTS Administrator or Tenant Administrator permission approves the package release request, the modified job is synchronized to the production environment.

                                                                      +

                                                                      In enterprise mode, when a developer submits a job version, the system generates a job release task. After the developer confirms releasing a package and the admin, deployer, a user with the DARTS Administrator or Tenant Administrator permission approves the package release request, the modified job is synchronized to the production environment.

                                                                      • When the admin selects Submitted for Job Status during job import, a release task is generated.
                                                                      • When the admin imports jobs in released state, no release task is generated.
                                                                      • When a developer creates a real-time single-task job, a release task is generated for the job, and no release task is generated for the subjobs of the job.

                                                                      Prerequisites

                                                                      You have submitted a version. For details, see Submitting a Version.

                                                                      -

                                                                      Procedure

                                                                      1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                      2. In the left navigation pane, choose Data Development > Task Release.
                                                                      3. On the Tasks page, the tasks generated for version submission are displayed. You can click View in the Operation column to view the modifications of a script compared with its previous version. After confirming that the modifications are correct, click Release to release the task.

                                                                        You can filter release tasks by name or submitter. and perform fuzzy search using a task name.

                                                                        -
                                                                        • If you have only the developer permission, the script will be synchronized to the production environment only when the task is approved by the admin or deployer.
                                                                        • After clicking Release, set the reviewer. The reviewer must be a workspace admin, deployer, or a user with the DARTS Administrator or Tenant Administrator permission. Set at least one reviewer and do not set yourself as the reviewer. Click Reviewer Management to go to the WorkSpaces page. Click Edit to configure reviewers.
                                                                        • You can release a maximum of 100 tasks at a time. The tasks are released asynchronously. You can view the task release process.
                                                                        • After you click Release, the following message is displayed: "Execute jobs in the package immediately after it is released."
                                                                        • You can revoke tasks not to be released as a developer, deployer, or admin.
                                                                        +

                                                                        Procedure

                                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                        3. In the left navigation pane, choose Data Development > Task Release.
                                                                        4. On the Tasks page, the tasks generated for version submission are displayed. You can click View in the Operation column to view the modifications of a script compared with its previous version. After confirming that the modifications are correct, click Release to release the task.

                                                                          You can filter release tasks by name or submitter. and perform fuzzy search using a task name.

                                                                          +
                                                                          • If you have only the developer permission, the script will be synchronized to the production environment only when the task is approved by the admin or deployer.
                                                                          • After clicking Release, set the reviewer. The reviewer must be a workspace admin, deployer, or a user with the DARTS Administrator or Tenant Administrator permission. Set at least one reviewer and do not set yourself as the reviewer. Click Reviewer Management to go to the WorkSpaces page. Click Edit to configure reviewers.
                                                                          • You can release a maximum of 100 tasks at a time. The tasks are released asynchronously. You can view the task release process.
                                                                          • After you click Release, the following message is displayed: "Execute jobs in the package immediately after it is released."
                                                                          • You can revoke tasks not to be released as a developer, deployer, or admin.
                                                                          -
                                                                          Figure 1 Clicking Release
                                                                          -

                                                                          -

                                                                        5. After the task is released, you can view the release status of the task on the Packages tab page. After approved, the task is released successfully.

                                                                          You can filter release tasks by Applicant, Application Time, Release At, or Released By, and perform fuzzy search using a package name.
                                                                          Figure 2 Viewing the task status
                                                                          +
                                                                          Figure 1 Clicking Release
                                                                          +

                                                                        6. After the task is released, you can view the release status of the task on the Packages tab page. After approved, the task is released successfully.

                                                                          You can filter release tasks by Applicant, Application Time, Release At, or Released By, and perform fuzzy search using a package name.
                                                                          Figure 2 Viewing the task status

                                                                          You can revoke tasks not to be released as a developer, deployer, or admin.

                                                                          After the task is released, you can click View Details in the Operation column to view the release status and startup status of the task. You can also click Compare Version in the Operation column to view the differences between different versions of release packages.

                                                                          -
                                                                          Figure 3 Viewing release package details
                                                                          +
                                                                          Figure 3 Viewing release package details

                                                                        @@ -28,3 +27,10 @@
                                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_2000.html b/docs/dataartsstudio/umn/dataartsstudio_01_2000.html index 14d57eca9..572b04742 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_2000.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_2000.html @@ -1,841 +1,842 @@

                                                                        Auto Table Creation

                                                                        -

                                                                        Field Mapping in Automatic Table Creation

                                                                        Figure 1 describes the field mapping between the DWS tables created by CDM and source tables. For example, if you use CDM to migrate the Oracle database to DWS, CDM automatically creates a table on DWS and maps the NUMBER(3,0) field of the Oracle database to the SMALLINT field of DWS.

                                                                        -
                                                                        Figure 1 Field mapping in automatic table creation
                                                                        -

                                                                        Table 1, Table 2, Table 3, and Table 4 describe the field type mapping between Hive tables and source tables when CDM automatically creates tables in Hive. For example, if you use CDM to migrate the MySQL database to Hive, CDM automatically creates a table on Hive and maps the YEAR field of the MySQL database to the DATE field of Hive.

                                                                        +

                                                                        CDM converts the field type of the source to the field type of the destination based on the default rule and creates a table at the destination.

                                                                        +

                                                                        Field Mapping in Automatic Table Creation

                                                                        Figure 1 describes the field mapping between the DWS tables created by CDM and source tables. For example, if you use CDM to migrate the Oracle database to DWS, CDM automatically creates a table on DWS and maps the NUMBER(3,0) field of the Oracle database to the SMALLINT field of DWS.

                                                                        +
                                                                        Figure 1 Field mapping in automatic table creation
                                                                        +

                                                                        Table 1, Table 2, Table 3, and Table 4 describe the field type mapping between Hive tables and source tables when CDM automatically creates tables in Hive. For example, if you use CDM to migrate the MySQL database to Hive, CDM automatically creates a table on Hive and maps the YEAR field of the MySQL database to the DATE field of Hive.

                                                                        • For the DECIMAL type, if the length of the source data exceeds the Hive length, the precision may be lost.
                                                                        • For the DECIMAL type, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the source is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0. In this case, precision loss may occur after data is written.
                                                                        -
                                                                        Table 1 Field mapping in automatic table creation for MySQL-to-Hive migration

                                                                        Data Type (MySQL)

                                                                        +
                                                                        - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                                                        Table 1 Field mapping in automatic table creation for MySQL-to-Hive migration

                                                                        Data Type (MySQL)

                                                                        Data Type (Hive)

                                                                        +

                                                                        Data Type (Hive)

                                                                        Description

                                                                        +

                                                                        Description

                                                                        Value

                                                                        +

                                                                        Value

                                                                        tinyint(1), bit(1)

                                                                        +

                                                                        tinyint(1), bit(1)

                                                                        BOOLEAN

                                                                        +

                                                                        BOOLEAN

                                                                        -

                                                                        +

                                                                        -

                                                                        TINYINT

                                                                        +

                                                                        TINYINT

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        TINYINT UNSIGNED

                                                                        +

                                                                        TINYINT UNSIGNED

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        SMALLINT UNSIGNED

                                                                        +

                                                                        SMALLINT UNSIGNED

                                                                        INTEGER

                                                                        +

                                                                        INTEGER

                                                                        -

                                                                        +

                                                                        -

                                                                        MEDIUMINT

                                                                        +

                                                                        MEDIUMINT

                                                                        INTEGER

                                                                        +

                                                                        INTEGER

                                                                        -

                                                                        +

                                                                        -

                                                                        MEDIUMINT UNSIGNED

                                                                        +

                                                                        MEDIUMINT UNSIGNED

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        -

                                                                        +

                                                                        -

                                                                        INT

                                                                        +

                                                                        INT

                                                                        INTEGER

                                                                        +

                                                                        INTEGER

                                                                        -

                                                                        +

                                                                        -

                                                                        INT UNSIGNED

                                                                        +

                                                                        INT UNSIGNED

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        -

                                                                        +

                                                                        -

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        -

                                                                        +

                                                                        -

                                                                        BIGINT UNSIGNED

                                                                        +

                                                                        BIGINT UNSIGNED

                                                                        DECIMAL(38,0)

                                                                        +

                                                                        DECIMAL(38,0)

                                                                        -

                                                                        +

                                                                        -

                                                                        DECIMAL(P,S)

                                                                        +

                                                                        DECIMAL(P,S)

                                                                        DECIMAL(P,S)

                                                                        +

                                                                        DECIMAL(P,S)

                                                                        The MySQL database supports a maximum of 65 bits. For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        +

                                                                        The MySQL database supports a maximum of 65 bits. For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        FLOAT UNSIGNED

                                                                        +

                                                                        FLOAT UNSIGNED

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        -

                                                                        +

                                                                        -

                                                                        DOUBLE UNSIGNED

                                                                        +

                                                                        DOUBLE UNSIGNED

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        -

                                                                        +

                                                                        -

                                                                        Time

                                                                        +

                                                                        Time

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        -

                                                                        +

                                                                        -

                                                                        YEAR

                                                                        +

                                                                        YEAR

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        -

                                                                        +

                                                                        -

                                                                        DATETIME

                                                                        +

                                                                        DATETIME

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        TIME

                                                                        +

                                                                        TIME

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Character

                                                                        +

                                                                        Character

                                                                        CHAR(N)

                                                                        +

                                                                        CHAR(N)

                                                                        CHAR(N*3)

                                                                        +

                                                                        CHAR(N*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        VARCHAR(N)

                                                                        +

                                                                        VARCHAR(N)

                                                                        VARCHAR(N*3)

                                                                        +

                                                                        VARCHAR(N*3)

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        VARBINARY

                                                                        +

                                                                        VARBINARY

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        TINYBLOB

                                                                        +

                                                                        TINYBLOB

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        MEDIUMBLOB

                                                                        +

                                                                        MEDIUMBLOB

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        BLOB

                                                                        +

                                                                        BLOB

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        LONGBLOB

                                                                        +

                                                                        LONGBLOB

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        TINYTEXT

                                                                        +

                                                                        TINYTEXT

                                                                        VARCHAR(765)

                                                                        +

                                                                        VARCHAR(765)

                                                                        -

                                                                        +

                                                                        -

                                                                        MEDIUMTEXT

                                                                        +

                                                                        MEDIUMTEXT

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        TEXT

                                                                        +

                                                                        TEXT

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        LONGTEXT

                                                                        +

                                                                        LONGTEXT

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Others

                                                                        +

                                                                        Others

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        -
                                                                        -
                                                                        Table 2 Field mapping in automatic table creation for Oracle-to-Hive migration

                                                                        Data Type (Oracle)

                                                                        +
                                                                        - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                                                        Table 2 Field mapping in automatic table creation for Oracle-to-Hive migration

                                                                        Data Type (Oracle)

                                                                        Data Type (Hive)

                                                                        +

                                                                        Data Type (Hive)

                                                                        Description

                                                                        +

                                                                        Description

                                                                        Character

                                                                        +

                                                                        Character

                                                                        CHAR(N)

                                                                        +

                                                                        CHAR(N)

                                                                        CHAR(N*3)

                                                                        +

                                                                        CHAR(N*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        VARCHAR(N)

                                                                        +

                                                                        VARCHAR(N)

                                                                        VARCHAR(N*3)

                                                                        +

                                                                        VARCHAR(N*3)

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        VARCHAR2

                                                                        +

                                                                        VARCHAR2

                                                                        VARCHAR(N*3)

                                                                        +

                                                                        VARCHAR(N*3)

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        NCHAR

                                                                        +

                                                                        NCHAR

                                                                        CHAR(N*3)

                                                                        +

                                                                        CHAR(N*3)

                                                                        -

                                                                        +

                                                                        -

                                                                        NVARCHAR2

                                                                        +

                                                                        NVARCHAR2

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Value

                                                                        +

                                                                        Value

                                                                        NUMBER

                                                                        +

                                                                        NUMBER

                                                                        DECIMAL(P,S)

                                                                        +

                                                                        DECIMAL(P,S)

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        +

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        BINARY_FLOAT

                                                                        +

                                                                        BINARY_FLOAT

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        BINARY_DOUBLE

                                                                        +

                                                                        BINARY_DOUBLE

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        -

                                                                        +

                                                                        -

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        Time

                                                                        +

                                                                        Time

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        TIMESTAMP WITH TIME ZONE

                                                                        +

                                                                        TIMESTAMP WITH TIME ZONE

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        TIMESTAMP WITH LOCAL TIME ZONE

                                                                        +

                                                                        TIMESTAMP WITH LOCAL TIME ZONE

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        INTERVAL

                                                                        +

                                                                        INTERVAL

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Binary

                                                                        +

                                                                        Binary

                                                                        BLOB

                                                                        +

                                                                        BLOB

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        CLOB

                                                                        +

                                                                        CLOB

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        NCLOB

                                                                        +

                                                                        NCLOB

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        LONG

                                                                        +

                                                                        LONG

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        LONG_RAW

                                                                        +

                                                                        LONG_RAW

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        RAW

                                                                        +

                                                                        RAW

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        Other

                                                                        +

                                                                        Other

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        -
                                                                        @@ -25,7 +25,7 @@ - @@ -36,7 +36,7 @@

                                                                        This method only obtains the parameter values configured for the current job, but not parameter values passed from the parent job or the global variables configured for the workspace.

                                                                        To obtain the parameter values passed from the parent job and the global variables configured for the workspace, you are advised to use the ${job_param_name} expression.

                                                                        - @@ -44,7 +44,7 @@ - @@ -52,7 +52,7 @@ - @@ -60,7 +60,7 @@ - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5098.html b/docs/dataartsstudio/umn/dataartsstudio_01_5098.html index 1783cc480..d9089c47f 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5098.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5098.html @@ -1,27 +1,19 @@ -

                                                                        Enterprise Mode

                                                                        +

                                                                        (Optional) Creating and Using a Workspace in Enterprise Mode

                                                                        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5099.html b/docs/dataartsstudio/umn/dataartsstudio_01_5099.html index c56ef2b1f..4c562ba42 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5099.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5099.html @@ -1,6 +1,6 @@ -

                                                                        DataArts Studio Enterprise Mode Overview

                                                                        +

                                                                        Introduction to the Enterprise Mode

                                                                        DataArts Studio provides two workspace modes, the simplified mode and enterprise mode, to help you manage your production data with varied security control requirements. This section describes the differences between the two modes from multiple dimensions, such as the physical form and impact on development.

                                                                        Currently, only Management Center and DataArts Factory support the enterprise mode.

                                                                        @@ -43,26 +43,26 @@
                                                                        Table 3 Field mapping in automatic table creation for PostgreSQL/DWS-to-Hive migration

                                                                        Data Type (PostgreSQL/DWS)

                                                                        +
                                                                        - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
                                                                        Table 3 Field mapping in automatic table creation for PostgreSQL/DWS-to-Hive migration

                                                                        Data Type (PostgreSQL/DWS)

                                                                        Data Type (Hive)

                                                                        +

                                                                        Data Type (Hive)

                                                                        Description

                                                                        +

                                                                        Description

                                                                        Value

                                                                        +

                                                                        Value

                                                                        int2

                                                                        +

                                                                        int2

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        int4

                                                                        +

                                                                        int4

                                                                        INT

                                                                        +

                                                                        INT

                                                                        -

                                                                        +

                                                                        -

                                                                        int8

                                                                        +

                                                                        int8

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        -

                                                                        +

                                                                        -

                                                                        real

                                                                        +

                                                                        real

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        float4

                                                                        +

                                                                        float4

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        float8

                                                                        +

                                                                        float8

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        -

                                                                        +

                                                                        -

                                                                        smallserial

                                                                        +

                                                                        smallserial

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        serial

                                                                        +

                                                                        serial

                                                                        INT

                                                                        +

                                                                        INT

                                                                        -

                                                                        +

                                                                        -

                                                                        bigserial

                                                                        +

                                                                        bigserial

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        -

                                                                        +

                                                                        -

                                                                        numeric(p,s)

                                                                        +

                                                                        numeric(p,s)

                                                                        DECIMAL(P,S)

                                                                        +

                                                                        DECIMAL(P,S)

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        +

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        money

                                                                        +

                                                                        money

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        -

                                                                        +

                                                                        -

                                                                        bit(1)

                                                                        +

                                                                        bit(1)

                                                                        TINYINT

                                                                        +

                                                                        TINYINT

                                                                        -

                                                                        +

                                                                        -

                                                                        varbit

                                                                        +

                                                                        varbit

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Character

                                                                        +

                                                                        Character

                                                                        varchar(n)

                                                                        +

                                                                        varchar(n)

                                                                        VARCHAR(N*3)

                                                                        +

                                                                        VARCHAR(N*3)

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        bpchar(n)

                                                                        +

                                                                        bpchar(n)

                                                                        CHAR(N*3)

                                                                        +

                                                                        CHAR(N*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        char(n)

                                                                        +

                                                                        char(n)

                                                                        CHAR(N*3)

                                                                        +

                                                                        CHAR(N*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        bytea

                                                                        +

                                                                        bytea

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        text

                                                                        +

                                                                        text

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Time

                                                                        +

                                                                        Time

                                                                        interval

                                                                        +

                                                                        interval

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        date

                                                                        +

                                                                        date

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        -

                                                                        +

                                                                        -

                                                                        time

                                                                        +

                                                                        time

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        timetz

                                                                        +

                                                                        timetz

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        timestamp

                                                                        +

                                                                        timestamp

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        timestamptz

                                                                        +

                                                                        timestamptz

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        Boolean

                                                                        +

                                                                        Boolean

                                                                        bool

                                                                        +

                                                                        bool

                                                                        BOOLEAN

                                                                        +

                                                                        BOOLEAN

                                                                        -

                                                                        +

                                                                        -

                                                                        Other

                                                                        +

                                                                        Other

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        -
                                                                        + + + +
                                                                        Table 4 Field mapping in automatic table creation for SQL Server-to-Hive migration

                                                                        Data Type (SQL Server)

                                                                        +
                                                                        - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - @@ -849,3 +850,10 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_2515.html b/docs/dataartsstudio/umn/dataartsstudio_01_2515.html deleted file mode 100644 index 6b0bd25b2..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_01_2515.html +++ /dev/null @@ -1,56 +0,0 @@ - - -

                                                                        Managing Terminal Subscriptions

                                                                        -

                                                                        Scenario

                                                                        You can configure terminal subscriptions (SMS messages, emails, and phone calls) by owner. After configuring a subscription, you can use the Manage Notification function to configure a job notification task. When a job runs abnormally or successfully, notifications are sent to the configured owners.

                                                                        -
                                                                        -

                                                                        Prerequisites

                                                                        Message notification has been enabled and a topic has been configured. Before configuring subscriptions by owner, ensure that you have set a job alarm notification topic for the workspace.

                                                                        -
                                                                        -

                                                                        Creating a Notification

                                                                        1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                        2. In the left navigation pane on the DataArts Factory console, choose Configuration > Configure. Choose Default Configuration. For details about how to configure alarm notification topics for workspace jobs by owner, see Job Alarm Notification Topic. If you have configured an alarm notification topic, skip this step.
                                                                          Figure 1 Setting Job Alarm Notification Topic
                                                                          -

                                                                          -
                                                                        3. In the navigation pane on the DataArts Factory page, choose Monitoring > Manage Notification.
                                                                        4. Click the Terminal Subscriptions tab and click Add Subscription. In the displayed dialog box, set required parameters.
                                                                          Figure 2 Adding a subscription
                                                                          -

                                                                          - -
                                                                        Table 4 Field mapping in automatic table creation for SQL Server-to-Hive migration

                                                                        Data Type (SQL Server)

                                                                        Data Type (Hive)

                                                                        +

                                                                        Data Type (Hive)

                                                                        Description

                                                                        +

                                                                        Description

                                                                        Value

                                                                        +

                                                                        Value

                                                                        TINYINT

                                                                        +

                                                                        TINYINT

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        SMALLINT

                                                                        +

                                                                        SMALLINT

                                                                        -

                                                                        +

                                                                        -

                                                                        INT

                                                                        +

                                                                        INT

                                                                        INT

                                                                        +

                                                                        INT

                                                                        -

                                                                        +

                                                                        -

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        BIGINT

                                                                        +

                                                                        BIGINT

                                                                        -

                                                                        +

                                                                        -

                                                                        DECIMAL

                                                                        +

                                                                        DECIMAL

                                                                        DECIMAL(P,S)

                                                                        +

                                                                        DECIMAL(P,S)

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        +

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        NUMERIC

                                                                        +

                                                                        NUMERIC

                                                                        DECIMAL(P,S)

                                                                        +

                                                                        DECIMAL(P,S)

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        +

                                                                        For Hive, the precision is greater than or equal to 1 and less than or equal to 38, and the scale is greater than or equal to 0. If the precision for the MySQL database is greater than 38 bits, the precision for Hive table creation is 38 bits. If the scale is less than 0, the scale for Hive table creation is 0.

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        DOUBLE

                                                                        +

                                                                        DOUBLE

                                                                        -

                                                                        +

                                                                        -

                                                                        REAL

                                                                        +

                                                                        REAL

                                                                        FLOAT

                                                                        +

                                                                        FLOAT

                                                                        -

                                                                        +

                                                                        -

                                                                        SMALLMONEY

                                                                        +

                                                                        SMALLMONEY

                                                                        DECIMAL(10,4)

                                                                        +

                                                                        DECIMAL(10,4)

                                                                        -

                                                                        +

                                                                        -

                                                                        MONEY

                                                                        +

                                                                        MONEY

                                                                        DECIMAL(19,4)

                                                                        +

                                                                        DECIMAL(19,4)

                                                                        -

                                                                        +

                                                                        -

                                                                        BIT(1)

                                                                        +

                                                                        BIT(1)

                                                                        TINYINT

                                                                        +

                                                                        TINYINT

                                                                        -

                                                                        +

                                                                        -

                                                                        Time

                                                                        +

                                                                        Time

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        DATE

                                                                        +

                                                                        DATE

                                                                        -

                                                                        +

                                                                        -

                                                                        DATETIME

                                                                        +

                                                                        DATETIME

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        DATETIME2

                                                                        +

                                                                        DATETIME2

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        -

                                                                        +

                                                                        -

                                                                        DATETIMEOFFSET

                                                                        +

                                                                        DATETIMEOFFSET

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        TIME(p)

                                                                        +

                                                                        TIME(p)

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        TIMESTAMP

                                                                        +

                                                                        TIMESTAMP

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        Character

                                                                        +

                                                                        Character

                                                                        CHAR(n)

                                                                        +

                                                                        CHAR(n)

                                                                        CHAR(n*3)

                                                                        +

                                                                        CHAR(n*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65535 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        VARCHAR(n)

                                                                        +

                                                                        VARCHAR(n)

                                                                        VARCHAR(n*3)

                                                                        +

                                                                        VARCHAR(n*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65536 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65536 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        NCHAR(n)

                                                                        +

                                                                        NCHAR(n)

                                                                        VARCHAR(n*3)

                                                                        +

                                                                        VARCHAR(n*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65537 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65537 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        NVARCHAR(n)

                                                                        +

                                                                        NVARCHAR(n)

                                                                        VARCHAR(n*3)

                                                                        +

                                                                        VARCHAR(n*3)

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65538 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        +

                                                                        If the value of (n*3<255) is greater than 255 (CHAR_MAX_LENGTH), varchar(N*3) is created. If the value of (n*3<255) is greater than 65538 (VARCHAR_MAX_LENGTH), a string is created.

                                                                        Binary

                                                                        +

                                                                        Binary

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        VARBINARY

                                                                        +

                                                                        VARBINARY

                                                                        BINARY

                                                                        +

                                                                        BINARY

                                                                        -

                                                                        +

                                                                        -

                                                                        TEXT

                                                                        +

                                                                        TEXT

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        Other

                                                                        +

                                                                        Other

                                                                        STRING

                                                                        +

                                                                        STRING

                                                                        -

                                                                        +

                                                                        -

                                                                        - - - - - - - - - - - - - - - - - -
                                                                        Table 1 Parameters for adding a subscription

                                                                        Parameter

                                                                        -

                                                                        Mandatory

                                                                        -

                                                                        Description

                                                                        -

                                                                        Owner

                                                                        -

                                                                        Yes

                                                                        -

                                                                        Set the subscription owner, which was configured during job creation.

                                                                        -

                                                                        Terminal Protocol

                                                                        -

                                                                        Yes

                                                                        -
                                                                        • SMS
                                                                        • Email
                                                                        • Phone
                                                                        -

                                                                        Terminal information

                                                                        -

                                                                        Yes

                                                                        -

                                                                        Set the information about the terminal.

                                                                        -
                                                                        -
                                                                        -
                                                                      4. Click OK.
                                                                      5. After the terminal subscription is created, you can perform the following operations on the notification:
                                                                        • Click Request Subscription. In the displayed dialog box, the subscription status is Unconfirmed. After you click OK, the subscription status becomes Confirmed.
                                                                        • Click Delete. In the Delete Subscription dialog box, click OK to delete the subscription.

                                                                          You can request or delete subscriptions, but cannot edit them.

                                                                          -
                                                                          -
                                                                        -
                                                                      6. After the preceding operations are complete, configure job alarm notifications by owner on the Managing Notifications page.
                                                                      7. - - -
                                                                        - -
                                                                        - diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_4105.html b/docs/dataartsstudio/umn/dataartsstudio_01_4105.html new file mode 100644 index 000000000..f696620cc --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_4105.html @@ -0,0 +1,34 @@ + + +

                                                                        Managing DataArts Studio Resources

                                                                        +

                                                                        You can centrally manage DataArts Studio resources.

                                                                        +

                                                                        Offline Resource Management

                                                                        You can view all CDM clusters in a DataArts Studio instance and associate workspaces with CDM clusters.

                                                                        +

                                                                        A CDM cluster is available in a workspace only after they are associated with each other.

                                                                        +
                                                                        +
                                                                        1. Log in to the DataArts Studio console as user DARTS Administrator or Tenant Administrator. For details, see Accessing the DataArts Studio Instance Console.
                                                                        2. Locate an instance and click Access. Then click the Resources tab.
                                                                        3. On the Offline Resources tab page, view all CDM clusters in the instance, such as their statuses, private IP addresses, and public IP addresses.

                                                                          +

                                                                        4. Click in the Name column to expand the cluster details, such as the AZ, VPC, subnet, security group, specifications, cluster ID, and associated workspaces.

                                                                          Figure 1 Viewing cluster details
                                                                          +

                                                                          +

                                                                        5. Locate a CDM cluster and click Associate with Workspace in the Operation column. In the displayed dialog box, select or deselect workspaces and click OK to associate the CDM cluster with the selected workspaces.

                                                                          The CDM cluster is only available in the associated workspaces.
                                                                          Figure 2 Associating a CDM cluster with workspaces
                                                                          +
                                                                          +

                                                                          +

                                                                        +
                                                                        +
                                                                        + + + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_4500.html b/docs/dataartsstudio/umn/dataartsstudio_01_4500.html index a7839a34a..157b31aaa 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_4500.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_4500.html @@ -66,7 +66,7 @@

                                                                        Yes

                                                                        Whether to re-execute a node if it fails to be executed. Possible values:

                                                                        -
                                                                        • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                          • Retry upon Timeout
                                                                          • Maximum Retries
                                                                          • Retry Interval (seconds)
                                                                          +
                                                                          • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                            • Retry upon Timeout
                                                                            • Maximum Retries
                                                                            • Retry Interval (seconds)
                                                                          • No: The node will not be re-executed. This is the default setting.
                                                                            NOTE:

                                                                            If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                                            If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                                            Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                                            @@ -89,6 +89,13 @@

                                                                        If you select this option, the node will not be executed, and a success message will be returned.

                                                                        Task Groups

                                                                        +

                                                                        No

                                                                        +

                                                                        Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                                        +
                                                                        diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_4503.html b/docs/dataartsstudio/umn/dataartsstudio_01_4503.html index a8f32b7bb..be6ade77b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_4503.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_4503.html @@ -3,9 +3,9 @@

                                                                        Developing a Python Script

                                                                        DataArts Factory allows you to develop, debug, and run Python scripts online. You can run developed scripts in jobs. For details, see Developing a Pipeline Job.

                                                                        For details about how to develop a Python scripts, see Developing a Python Script.

                                                                        -

                                                                        Prerequisites

                                                                        • A Python script has been added. For details, see Creating a Script.
                                                                        • A host connection has been created. The Linux host is used to execute Python scripts. For details about how to create a host connection, see Configuring a Host Connection.
                                                                        • You have the permission to create and execute files in the /tmp directory on the host.
                                                                        • The maximum number of shell or Python scripts that can run concurrently on the ECS is determined by the value of MaxSessions in the /etc/ssh/sshd_config file on the ECS. Set MaxSessions based on the scheduling frequency of shell or Python scripts.
                                                                        • You have locked the script. Otherwise, you must click Lock so that you can develop the script. A script you create or import is locked by you by default. For details, see the lock function.
                                                                        +

                                                                        Prerequisites

                                                                        • A Python script has been added. For details, see Creating a Script.
                                                                        • A host connection has been created. The Linux host is used to execute Python scripts. For details about how to create a host connection, see Host Connection Parameters.
                                                                        • You have the permission to create and execute files in the /tmp directory on the host.
                                                                        • The maximum number of shell or Python scripts that can run concurrently on the ECS is determined by the value of MaxSessions in the /etc/ssh/sshd_config file on the ECS. Set MaxSessions based on the scheduling frequency of shell or Python scripts.
                                                                        • You have locked the script. Otherwise, you must click Lock so that you can develop the script. A script you create or import is locked by you by default. For details, see the lock function.
                                                                        -

                                                                        Procedure

                                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                        2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                        3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                        4. In the script directory list, double-click a script that you want to develop. The script development page is displayed.
                                                                        5. In the upper part of the editor, configure the Python version and the host connection for executing the Python script. +

                                                                          Procedure

                                                                          1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                          2. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                          3. In the left navigation pane of DataArts Factory, choose Data Development > Develop Script.
                                                                          4. In the script directory list, double-click a script that you want to develop. The script development page is displayed.
                                                                          5. In the upper part of the editor, configure the Python version and the host connection for executing the Python script.
                                                                            Table 1 Python script properties

                                                                            Parameter

                                                                            Description

                                                                            @@ -47,18 +47,24 @@
                                                                            -
                                                                          6. Edit Python statements in the editor. To facilitate script development, DataArts Factory provides the following capabilities:
                                                                            • The script editor supports the following shortcut keys, which improve the script development efficiency:
                                                                              • F8: Run a script.
                                                                              • F9: Stop running a script.
                                                                              • Ctrl + /: Comment out or uncomment the line or code block where the cursor resides.
                                                                              • Ctrl + S: Save a script.
                                                                              • Ctrl + Z: Undo an action.
                                                                              • Ctrl + F: Search for information.
                                                                              • Ctrl + Shift + R: Replace
                                                                              • Ctrl + X: Cut (Cut a line when the cursor selects nothing.)
                                                                              • Alt + mouse dragging: Select columns to edit a block.
                                                                              • Ctrl + mouse click: Select multiple lines to edit or indent them together.
                                                                              • Shift + Ctrl + K: Delete the current line.
                                                                              • Ctrl + (or ): Move the cursor rightwards (or leftwards) by word.
                                                                              • Ctrl + Home or Ctrl + End: Navigate to the beginning or end of the current file.
                                                                              • Home or End: Navigate to the beginning or end of the current line.
                                                                              • Ctrl + Shift + L: Double-click all the same character strings and add cursors to them to implement batch modification.
                                                                              • Ctrl + D: Delete a line.
                                                                              • Shift + Ctrl + U: Unlock a script.
                                                                              • Ctrl + Alt + K: Select the word where the cursor resides.
                                                                              • Ctrl + B: Format
                                                                              • Ctrl + Shift + Z: Redo
                                                                              • Ctrl + Enter: Execute the selected line or content.
                                                                              • Ctrl + Alt + F: Flag
                                                                              • Ctrl + Shift + K: Search for the previous one.
                                                                              • Ctrl + K: Search for the next one.
                                                                              • Ctrl + Backspace: Delete the word to the left of the cursor.
                                                                              • Ctrl + Delete: Delete the word to the right of the cursor.
                                                                              • Alt + Backspace: Delete all content from the beginning of the line to the cursor.
                                                                              • Alt + Delete: Delete all content from the cursor to the end of the line.
                                                                              • Alt + Shift-Left: Select all content from the beginning of the line to the cursor.
                                                                              • Alt + Shift-Right: Select all content from the cursor to the end of the line.
                                                                              -
                                                                            • Script parameter function. Use this function in either of the following ways:
                                                                              1. Write the script parameter name and parameter value in the Python statement. When the Python script is referenced by a job, if the parameter name configured for the job is the same as the parameter name of the Python script, the parameter value of the Python script is replaced by the parameter value of the job.
                                                                                The following is an example script:
                                                                                a=1
                                                                                -print {a}
                                                                                +
                                                                              2. Edit Python statements in the editor. To facilitate script development, DataArts Factory provides the following capabilities:
                                                                                • The script editor supports the following shortcut keys, which improve the script development efficiency:
                                                                                  • F8: Run a script.
                                                                                  • F9: Stop running a script.
                                                                                  • Ctrl + /: Comment out or uncomment the line or code block where the cursor resides.
                                                                                  • Ctrl + S: Save a script.
                                                                                  • Ctrl + Z: Undo an action.
                                                                                  • Ctrl + F: Search for information.
                                                                                  • Ctrl + Shift + R: Replace
                                                                                  • Ctrl + X: Cut (Cut a line when the cursor selects nothing.)
                                                                                  • Alt + mouse dragging: Select columns to edit a block.
                                                                                  • Ctrl + mouse click: Select multiple lines to edit or indent them together.
                                                                                  • Ctrl + (or ): Move the cursor rightwards (or leftwards) by word.
                                                                                  • Ctrl + Home or Ctrl + End: Navigate to the beginning or end of the current file.
                                                                                  • Home or End: Navigate to the beginning or end of the current line.
                                                                                  • Ctrl + Shift + L: Double-click all the same character strings and add cursors to them to implement batch modification.
                                                                                  • Ctrl + D: Delete a line.
                                                                                  • Shift + Ctrl + U: Unlock a script.
                                                                                  • Ctrl + Alt + K: Select the word where the cursor resides.
                                                                                  • Ctrl + B: Format
                                                                                  • Ctrl + Shift + Z: Redo
                                                                                  • Ctrl + Enter: Execute the selected line or content.
                                                                                  • Ctrl + Alt + F: Flag
                                                                                  • Ctrl + Shift + K: Search for the previous one.
                                                                                  • Ctrl + K: Search for the next one.
                                                                                  • Ctrl + Backspace: Delete the word to the left of the cursor.
                                                                                  • Ctrl + Delete: Delete the word to the right of the cursor.
                                                                                  • Alt + Backspace: Delete all content from the beginning of the line to the cursor.
                                                                                  • Alt + Delete: Delete all content from the cursor to the end of the line.
                                                                                  • Alt + Shift-Left: Select all content from the beginning of the line to the cursor.
                                                                                  • Alt + Shift-Right: Select all content from the cursor to the end of the line.
                                                                                  +
                                                                                • Script parameter function. Use this function in either of the following ways:
                                                                                  1. Write the script parameter name and parameter value in the Python statement. When the Python script is referenced by a job, if the parameter name configured for the job is the same as the parameter name of the Python script, the parameter value of the Python script is replaced by the parameter value of the job.
                                                                                    Transfer parameters in the script. The following is an example script:
                                                                                    a=1
                                                                                    +print (a)
                                                                                    +or
                                                                                    +a= 'qqq'
                                                                                    +print (a)
                                                                                    +
                                                                                    +
                                                                                    Transfer parameters outside the script. For example, if you want to transfer parameters of the Python script to a Python job which uses the Python script, enclose string parameters in single quotation marks. The following is an example script:
                                                                                    a= 'zhang'
                                                                                    +print (${a})

                                                                                    In the preceding command, a indicates the parameter name. It can contain only letters, digits, hyphens (-), underscores (_), greater-than signs (>), and less-than signs (<), and can contain a maximum of 16 characters. The parameter name must be unique.

                                                                                  2. Click Input Parameters and set parameters, which will be transferred to the Python script during execution of the script. Separate parameters by spaces, for example, a b c. The parameter must be referenced by the Python script. Otherwise, the parameter is invalid.
                                                                                • Owner

                                                                                  Click Basic Info to set the script owner and description.

                                                                                  -
                                                                                • The script cannot be larger than 16 MB.
                                                                                • Allows you to go to the release page from the script development page in enterprise mode. Place the cursor over and click Release.
                                                                                -
                                                                              3. In the upper part of the editor, click Execute. After executing the Python statement, view the execution history and result of the script in the lower part of the editor.
                                                                                You can perform the following operations on execution results:
                                                                                • Double-click or right-click the name of an execution result tab to rename it. The name can contain a maximum of 16 characters.
                                                                                • Right-click the name of an execution result tab to close the current tab, all the tabs to the left or right of the current tab, all the other tabs, or all the tabs.
                                                                                • The execution result of a Python script cannot be larger than 30 MB. Otherwise, an error is reported.
                                                                                +
                                                                              4. The script cannot be larger than 16 MB.
                                                                              5. Allows you to go to the release page from the script development page in enterprise mode. Place the cursor over and click Release.
                                                                            +
                                                                          7. In the upper part of the editor, click Execute. After executing the Python statement, view the execution history and result of the script in the lower part of the editor.
                                                                            You can perform the following operations on execution results:
                                                                            • Double-click or right-click the name of an execution result tab to rename it. The name can contain a maximum of 16 characters.
                                                                            • Right-click the name of an execution result tab to close the current tab, all the tabs to the left or right of the current tab, all the other tabs, or all the tabs.
                                                                            • The execution result of a Python script cannot be larger than 30 MB. Otherwise, an error is reported.
                                                                            • When viewing the script execution result, you can double-click a field in any row to view the result details. You can copy the field name.
                                                                            • You can control display of the script execution history by setting Script Execution History in Default Configuration to Myself or All users.
                                                                            -
                                                                          8. Above the editor, click to save the script.
                                                                            If the script is created but not saved, set the parameters listed in Table 3. +
                                                                          9. Above the editor, click Save to save the script.
                                                                            If the script is created but not saved, set the parameters listed in Table 3.
                                                                            + + + +
                                                                            Table 3 Script parameters

                                                                            Parameter

                                                                            Mandatory

                                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_4504.html b/docs/dataartsstudio/umn/dataartsstudio_01_4504.html index 2163a0ba6..a2c3e5bb2 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_4504.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_4504.html @@ -115,6 +115,13 @@

                                                                            If you select this option, the node will not be executed, and a success message will be returned.

                                                                            Task Groups

                                                                            +

                                                                            No

                                                                            +

                                                                            Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                                            +
                                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_4509.html b/docs/dataartsstudio/umn/dataartsstudio_01_4509.html new file mode 100644 index 000000000..5f4d3355e --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_4509.html @@ -0,0 +1,120 @@ + + +

                                                                            DORIS SQL

                                                                            +

                                                                            Functions

                                                                            The Doris SQL node transfers SQL statements to Doris for execution.

                                                                            +
                                                                            +

                                                                            Parameters

                                                                            Table 1 and Table 2 describe the parameters of the Doris SQL node.

                                                                            + +
                                                                            + + + + + + + + + + + + + + + + + + + + + +
                                                                            Table 1 Parameters of the Doris SQL node

                                                                            Parameter

                                                                            +

                                                                            Mandatory

                                                                            +

                                                                            Description

                                                                            +

                                                                            Node Name

                                                                            +

                                                                            Yes

                                                                            +

                                                                            Name of a node. The name must contain 1 to 128 characters, including only letters, numbers, underscores (_), hyphens (-), slashes (/), less-than signs (<), and greater-than signs (>).

                                                                            +

                                                                            By default, the node name is the same as that of the selected script. If you want the node name to be different from the script name, disable this function by referring to Disabling Auto Node Name Change.

                                                                            +

                                                                            SQL or Script

                                                                            +

                                                                            Yes

                                                                            +
                                                                            • SQL statement

                                                                              Click the text box under SQL statement and enter the SQL statement to be executed.

                                                                              +
                                                                            • SQL script

                                                                              Select a script to be executed. If no script is available, create and develop a script by referring to Creating a Script and Developing an SQL Script. If the associated SQL script uses a parameter, the parameter name is displayed. Set the parameter value in the text box next to the parameter name.

                                                                              +
                                                                              NOTE:

                                                                              If you select the SQL statement mode, the DataArts Factory module cannot parse the parameters contained in the SQL statement.

                                                                              +
                                                                              +
                                                                            +

                                                                            Data Connection

                                                                            +

                                                                            Yes

                                                                            +

                                                                            Select a data connection.

                                                                            +

                                                                            Database

                                                                            +

                                                                            Yes

                                                                            +

                                                                            Name of the database. The database has been created. You are advised not to use the default database.

                                                                            +
                                                                            +
                                                                            +
                                                                            + +
                                                                            + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
                                                                            Table 2 Advanced parameters

                                                                            Parameter

                                                                            +

                                                                            Mandatory

                                                                            +

                                                                            Description

                                                                            +

                                                                            Node Status Polling Interval (s)

                                                                            +

                                                                            Yes

                                                                            +

                                                                            How often the system check completeness of the node. The value ranges from 1 to 60 seconds.

                                                                            +

                                                                            Max. Node Execution Duration

                                                                            +

                                                                            Yes

                                                                            +

                                                                            Execution timeout interval for the node. If retry is configured and the execution is not complete within the timeout interval, the node will be executed again.

                                                                            +

                                                                            Retry upon Failure

                                                                            +

                                                                            Yes

                                                                            +

                                                                            Whether to re-execute a node if it fails to be executed. Possible values:

                                                                            +
                                                                            • Yes: The node will be re-executed, and the following parameters must be configured:
                                                                              • Retry upon Timeout
                                                                              • Maximum Retries
                                                                              • Retry Interval (seconds)
                                                                              +
                                                                            • No: The node will not be re-executed. This is the default setting.
                                                                              NOTE:

                                                                              If retry is configured for a job node and the timeout duration is configured, the system allows you to retry a node when the node execution times out.

                                                                              +

                                                                              If a node is not re-executed when it fails upon timeout, you can go to the Default Configuration page to modify this policy.

                                                                              +

                                                                              Retry upon Timeout is displayed only when Retry upon Failure is set to Yes.

                                                                              +
                                                                              +
                                                                            +

                                                                            Policy for Handling Subsequent Nodes If the Current Node Fails

                                                                            +

                                                                            Yes

                                                                            +

                                                                            Operation that will be performed if the node fails to be executed. Possible values:

                                                                            +
                                                                            • Suspend execution plans of the subsequent nodes: stops running subsequent nodes. The job instance status is Failed.
                                                                            • End the current job execution plan: stops running the current job. The job instance status is Failed.
                                                                            • Go to the next node: ignores the execution failure of the current node. The job instance status is Failure ignored.
                                                                            • Suspend the current job execution plan: If the current job instance is in abnormal state, the subsequent nodes of this node and the subsequent job instances that depend on the current job are in waiting state.
                                                                            +

                                                                            Enable Dry Run

                                                                            +

                                                                            No

                                                                            +

                                                                            If you select this option, the node will not be executed, and a success message will be returned.

                                                                            +

                                                                            Task Groups

                                                                            +

                                                                            No

                                                                            +

                                                                            Select a task group. If you select a task group, you can control the maximum number of concurrent nodes in the task group in a fine-grained manner in scenarios where a job contains multiple nodes, a data patching task is ongoing, or a job is rerunning.

                                                                            +
                                                                            +
                                                                            +
                                                                            +
                                                                            + +
                                                                            + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_4803.html b/docs/dataartsstudio/umn/dataartsstudio_01_4803.html index ecb753514..548b68878 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_4803.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_4803.html @@ -17,7 +17,7 @@

                                                                            For example, to check whether a node is running successfully, you can use the following command, where test indicates the node name:

                                                                            #{(Job.getNodeStatus("test")) == "success" }

                                                                            -

                                                                        Obtain the running status of the test node:

                                                                        +

                                                                        Obtains the running status of the test node:

                                                                        #{Job.getNodeStatus("test")}

                                                                        Obtains the output of a specified node. This method can only obtain the output of the previous dependent node.

                                                                        • Obtain the output of the test node:

                                                                          #{Job.getNodeOutput("test")}

                                                                          +
                                                                        • Obtains the output of the test node:

                                                                          #{Job.getNodeOutput("test")}

                                                                        • If the previous node has no execution result, the output is null.
                                                                        • If the output of a node is a field, the output result is in the format like [["000"]]. In this case, you can use the EL expression to split the string result and obtain the field value output by the previous node. Note that the output result type is string. If you want to output the original data type, you need to use the EL expression of the For Each node and the loop embedded objects supported by the node.

                                                                          #{StringUtil.split(StringUtil.split(StringUtil.split(Job.getNodeOutput("Name of the previous node"),"]")[0],"[")[0],"\\"")[0]}

                                                                        • If the output of a node contains two or more fields, the output result is in the format like [["000"],["001"]]. In this case, you need to obtain the output result using the EL expression of the For Each node and the loop embedded objects supported by the node, for example, #{Loop.current[0]}.

                                                                        Obtain the value of the test parameter:

                                                                        +

                                                                        Obtains the value of the test parameter:

                                                                        #{Job.getParam("test")}

                                                                        Obtains the plan time character string in a specified pattern. Pattern indicates the date and time mode. For details, see Date and Time Mode.

                                                                        Obtain the planned job scheduling time, which is accurate to millisecond:

                                                                        +

                                                                        Obtains the planned job scheduling time, which is accurate to millisecond:

                                                                        #{Job.getPlanTime("yyyy-MM-dd HH:mm:ss:SSS")}

                                                                        Obtains the time character string of the day before the plan time. Pattern indicates the date and time mode. For details, see Date and Time Mode.

                                                                        Obtain the time on the previous day of the planned job scheduling time, which is accurate to date:

                                                                        +

                                                                        Obtains the time on the previous day of the planned job scheduling time, which is accurate to date:

                                                                        #{Job.getYesterday("yyyy-MM-dd HH:mm:ss:SSS")}

                                                                        Obtains the time character string of last hour before the plan time. Pattern indicates the date and time mode. For details, see Date and Time Mode.

                                                                        Obtain the time one hour before the planned job scheduling time, which is accurate to hour:

                                                                        +

                                                                        Obtains the time one hour before the planned job scheduling time, which is accurate to hour:

                                                                        #{Job.getLastHour("yyyy-MM-dd HH:mm:ss:SSS")}

                                                                        -

                                                                        Important Notes

                                                                        • Different workspace modes have certain requirements on the data lake engine. To isolate the development environment from the production environment of a workspace that uses the enterprise mode, you must configure a data lake engine for both environments. You can configure isolation between the development and production environments using any of the methods shown in the following figure.
                                                                          Figure 1 Configuring isolation between the development and production environments
                                                                          -
                                                                          • Configure two sets of data lake services to isolate the development environment from the production environment.

                                                                            For clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services that have the same version, specifications, components, region, VPC, subnet, and other related configurations. For details, see Creating a Data Connection.

                                                                            +

                                                                            Important Notes

                                                                            • Different workspace modes have certain requirements on the data lake engine. To isolate the development environment from the production environment of a workspace that uses the enterprise mode, you must configure a data lake engine for both environments. You can configure isolation between the development and production environments using any of the methods shown in the following figure.
                                                                              Figure 1 Configuring isolation between the development and production environments
                                                                              +
                                                                              • Configure two sets of data lake services to isolate the development environment from the production environment.

                                                                                For clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services that have the same version, specifications, components, region, VPC, subnet, and other related configurations. For details, see Creating a DataArts Studio Data Connection.

                                                                                When creating a data connection, you can select different clusters for the development environment and production environment to isolate them.

                                                                                -
                                                                                Figure 2 Selecting different clusters during data connection creation
                                                                                +
                                                                                Figure 2 Selecting different clusters during data connection creation

                                                                              • Configure environment isolation for DLI.

                                                                                Configure environment isolation in enterprise mode, including DLI queue configuration and DB configuration.

                                                                                -

                                                                                For serverless services (such as DLI), you can configure the mapping between data lake services in the production environment and those in the development environment through environment isolation in Management Center. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.

                                                                                +

                                                                                For serverless services (such as DLI), you can configure the mapping between data lake services in the production environment and those in the development environment through environment isolation in Management Center. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.

                                                                              • Configure two databases in the same data lake service to isolate the development environment from the production environment.

                                                                                For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection (as shown in Figure 3), you must configure database mapping on the Configure Data Source Resource Mapping page shown in Figure 4 to isolate the development and production environments. For details, see DB configuration.

                                                                                -
                                                                                Figure 3 Selecting the same cluster during data connection creation
                                                                                +
                                                                                Figure 3 Selecting the same cluster during data connection creation

                                                                                -
                                                                                Figure 4 DB Configuration
                                                                                +
                                                                                Figure 4 DB Configuration

                                                                            • Data development jobs in the development environment of a workspace that uses the enterprise mode are not scheduled by default. They can be scheduled only after released to the production environment.

                                                                            Introduction to the Simple Mode and Enterprise Mode

                                                                            Typically, DataArts Studio workspaces use the simple mode. In this mode, you cannot isolate the development and production environment in the DataArts Factory and Management Center modules of DataArts Studio, or control the data development process or table permissions. Instead, you can only perform simple data development operations. A data lake functions as the production environment of DataArts Studio.

                                                                            -
                                                                            Figure 5 A workspace using the simple mode
                                                                            +
                                                                            Figure 5 A workspace using the simple mode
                                                                            The enterprise mode of DataArts Studio workspaces eliminates the risks of the simple mode. In this mode, you can isolate the development environment from the production environment in the DataArts Factory and Management Center modules of DataArts Studio. This prevents developers' operations from affecting services in the production environment. This mode requires two data lakes, one as the development environment and the other as the production environment.
                                                                            • The development environment is accessible only to developers for script and job development and release of scripts and jobs to the production environment.
                                                                            • The production environment is accessible only to end users and allows no change. Any change that is required must be made in the development environment and released to the production environment again.
                                                                            -
                                                                            Figure 6 A workspace using the enterprise mode
                                                                            +
                                                                            Figure 6 A workspace using the enterprise mode
                                                                            • You can create a workspace in either mode to experience DataArts Studio. With a workspace in enterprise mode, you can isolate the code, compute resources, and permissions of the development environment from those of the production environment, and manage the task release process.
                                                                            • If you are using a workspace in simple mode and want to experience the enterprise mode while retaining the code of the workspace, you can upgrade the workspace. For details, see Creating a Workspace in Enterprise Mode.
                                                                            @@ -77,7 +77,7 @@

                                                                        Management of the production task development process

                                                                        • After a task is submitted, it can be periodically executed to generate result data without being released.
                                                                        +

                                                                        After a task is submitted, it can be periodically executed to generate result data without being released.

                                                                        The process is submission and then production.

                                                                        • You need to submit a task to the development environment and release the task to the production environment. Then the task can be automatically executed.
                                                                        @@ -138,8 +138,8 @@
                                                                        -

                                                                        Process of Using DataArts Studio in Different Workspace Modes

                                                                        • In the simple mode, you cannot isolate the development and production environment in the DataArts Factory and Management Center modules of DataArts Studio, or control the data development process or table permissions. Instead, you can only perform simple data development operations. After submitting a script or job, you do not need to release it. The script or job can be periodically executed to generate result data.
                                                                          Figure 7 Process in simple mode
                                                                          -
                                                                        • In the enterprise mode, you can isolate the development environment from the production environment in the DataArts Factory and Management Center modules of DataArts Studio. This prevents developers' operations from affecting services in the production environment. The development environment is accessible only to developers for script and job development and release of scripts and jobs to the production environment. The production environment is accessible only to end users and allows no change. Any change that is required must be made in the development environment and released to the production environment again.
                                                                          Figure 8 Process in enterprise mode
                                                                          +

                                                                          Process of Using DataArts Studio in Different Workspace Modes

                                                                          • In the simple mode, you cannot isolate the development and production environment in the DataArts Factory and Management Center modules of DataArts Studio, or control the data development process or table permissions. Instead, you can only perform simple data development operations. After submitting a script or job, you do not need to release it. The script or job can be periodically executed to generate result data.
                                                                            Figure 7 Process in simple mode
                                                                            +
                                                                          • In the enterprise mode, you can isolate the development environment from the production environment in the DataArts Factory and Management Center modules of DataArts Studio. This prevents developers' operations from affecting services in the production environment. The development environment is accessible only to developers for script and job development and release of scripts and jobs to the production environment. The production environment is accessible only to end users and allows no change. Any change that is required must be made in the development environment and released to the production environment again.
                                                                            Figure 8 Process in enterprise mode

                                                                          Operations Allowed by DataArts Studio Modules in Different Workspace Modes

                                                                          @@ -172,7 +172,14 @@
                                                                          + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5100.html b/docs/dataartsstudio/umn/dataartsstudio_01_5100.html index 9a0479511..c5ef5c825 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5100.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5100.html @@ -2,7 +2,7 @@

                                                                          Service Process in Enterprise Mode

                                                                          The DataArts Studio enterprise mode mainly involves the Management Center and DataArts Factory components. The service process is completed by the admin, developer, deployer, and operator.

                                                                          -
                                                                          Figure 1 Enterprise mode architecture
                                                                          +
                                                                          Figure 1 Enterprise mode architecture
                                                                          • The admin performs operations such as preparing a data lake, configuring data connections and environment isolation, importing and exporting data, and configuring project user permissions.
                                                                          • The developer develops and tests scripts and jobs, and submits versions and release tasks in the development environment.
                                                                          • The deployer reviews the submitted tasks in the development environment.
                                                                          • The operator performs operations such as job monitoring, notification management, and backup in the production environment based on the resources released by the developer.
                                                                          • Custom role: You can customize operation permissions to meet your requirements.
                                                                          • The viewer can only read data from DataArts Studio, but cannot perform operations or modify work items or configurations. You are advised to assign this role to users who only want to view information in the workspace.
                                                                            @@ -54,7 +54,14 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5101.html b/docs/dataartsstudio/umn/dataartsstudio_01_5101.html index f5f66bebd..1258c4a55 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5101.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5101.html @@ -12,11 +12,11 @@ @@ -25,26 +25,20 @@ - - - - - @@ -54,7 +48,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5102.html b/docs/dataartsstudio/umn/dataartsstudio_01_5102.html index cfed27b43..9dc9d437b 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5102.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5102.html @@ -27,7 +27,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5103.html b/docs/dataartsstudio/umn/dataartsstudio_01_5103.html index 7dff7c066..d8f023900 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5103.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5103.html @@ -6,16 +6,23 @@

                                                                            Prerequisites

                                                                            The developer has completed the operations in Releasing a Script Task or Releasing a Job Task.

                                                                            Procedure

                                                                            1. On the DataArts Studio console, locate a workspace and click DataArts Factory.
                                                                            2. In the left navigation pane, choose Data Development > Task Release.
                                                                            3. Click the Packages tab. You can click View Details in the Operation column to view the changes of the task compared with its previous version.

                                                                              • If there is any issue, click Revoke to reject the release task. After the developer modifies and submits the release task again, you can review it again.
                                                                              • After confirming that the release task has no remaining issue, click Release to approve the task.
                                                                              -
                                                                              Figure 1 Reviewing and releasing a task
                                                                              +
                                                                              Figure 1 Reviewing and releasing a task

                                                                              -

                                                                            4. After the task is released, you can view its status. The developer's modification is synchronized to the production environment.

                                                                              Figure 2 Viewing the task status
                                                                              +

                                                                            5. After the task is released, you can view its status. The developer's modification is synchronized to the production environment.

                                                                              Figure 2 Viewing the task status

                                                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5104.html b/docs/dataartsstudio/umn/dataartsstudio_01_5104.html index 01d40640f..22cab6bac 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5104.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5104.html @@ -30,7 +30,7 @@ - - + + + + + + + + + + @@ -27,7 +45,7 @@

                                                                            Use Constraints

                                                                            Before using DataArts Studio, you must read and understand the following restrictions: -
                                                                            Table 1 Permissions of different roles

                                                                            Role

                                                                            The preparations include preparing data lakes and preparing and synchronizing data.

                                                                            Preparing data lakes:

                                                                            -
                                                                            In enterprise mode, the development environment and production environment need to be isolated. Therefore, you need to prepare two data lake services, one for the production environment and the other for the development environment.
                                                                            • For clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two data lake services (clusters) that have the same version, specifications, components, region, VPC, subnet, and other related configurations.

                                                                              For example, if your data lake service is an MRS cluster, you need to prepare two MRS clusters with the same version, specifications, components, region, VPC, and subnet. Any change to the configuration of one of the MRS clusters must be synchronized to the other cluster.

                                                                              +
                                                                              In enterprise mode, the development environment and production environment need to be isolated. Therefore, you need to prepare two data lake services, one for the production environment and the other for the development environment.
                                                                              • For clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two data lake services (clusters) that have the same version, specifications, components, region, VPC, subnet, and other related configurations.

                                                                                For example, if your data lake service is an MRS cluster, you need to prepare two MRS clusters with the same version, specifications, components, region, VPC, and subnet. Any change to the configuration of one of the MRS clusters must be synchronized to the other cluster.

                                                                              • For serverless services (such as DLI), you can configure the mapping between data lake services in the production environment and those in the development environment through environment isolation in Management Center. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of queue and database resources in the serverless data lake service. You are advised to distinguish them by name suffix.
                                                                              • If GaussDB(DWS), MRS Hive, and MRS Spark data sources use the same cluster, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments.

                                                                              Preparing and synchronizing data:

                                                                              -
                                                                              • After creating data lake services, you must create databases, database schemas (required only for DWS), and data tables in the data lake services of the development and production environments based on the project plan (for example, the databases and tables required for data development).
                                                                                • For clustered data sources (such as MRS, DWS, RDS, MySQL, Oracle, DIS and ECS), use two clusters, one for the development environment and the other for the production environment. The names of the databases, database schemas (required only for DWS), and data tables in the two environments must be the same.
                                                                                • For serverless services (such as DLI), you are advised to associate and distinguish the two queues and databases by name suffix (add suffix _dev to the names of the queues and databases in the development environment and add no suffix to those in the production environment). The names of data tables in the development environment must be the same as those in the production environment.
                                                                                • For DWS, MRS Hive, and MRS Spark data sources that use the same cluster, use two databases to isolate the development and production environments (add suffix _dev to the database for the development environment and add no suffix to the database for the production environment). The names of database schemas (required only for DWS) and data tables in the development environment must be the same as those in the production environment.
                                                                                +
                                                                                • After creating data lake services, you must create databases, database schemas (required only for DWS), and data tables in the data lake services of the development and production environments based on the project plan (for example, the databases and tables required for data development).
                                                                                  • For clustered data sources (such as MRS, DWS, RDS, MySQL, Oracle, and ECS), use two clusters, one for the development environment and the other for the production environment. The names of the databases, database schemas (required only for DWS), and data tables in the two environments must be the same.
                                                                                  • For serverless services (such as DLI), you are advised to associate and distinguish the two queues and databases by name suffix (add suffix _dev to the names of the queues and databases in the development environment and add no suffix to those in the production environment). The names of data tables in the development environment must be the same as those in the production environment.
                                                                                  • For DWS, MRS Hive, and MRS Spark data sources that use the same cluster, use two databases to isolate the development and production environments (add suffix _dev to the database for the development environment and add no suffix to the database for the production environment). The names of database schemas (required only for DWS) and data tables in the development environment must be the same as those in the production environment.
                                                                                • After creating databases, database schemas (required only for DWS), and data tables, you must synchronize data of existing tables (if any) between the two data lake services.
                                                                                  • Existing data in data lakes: Use data migration services such as CDM and DRS to synchronize data in batches between data lakes.
                                                                                  • Data to be migrated from the data source: Use peering jobs of data migration services such as CDM and DRS to synchronize data between the data lake service of the production environment and that of the development environment.

                                                                            You must create data connections for all data lake engines.

                                                                            For clustered data sources that use different clusters, you can create a data connection between DataArts Studio and the data lake of the development environment and a data connection between DataArts Studio and the data lake of the production environment at the same time.

                                                                            -

                                                                            For details, see Creating a Data Connection.

                                                                            +

                                                                            For details, see Creating a DataArts Studio Data Connection.

                                                                            Configuring environment isolation for a workspace in enterprise mode

                                                                            Configure DLI queue and DB mapping to isolate the development and production environments.

                                                                            For the DWS, MRS Hive, and MRS Spark data sources, if you select the same cluster when creating a data connection, you need to configure two databases for the same data lake service to isolate the development environment from the production environment. For details, see DB Configuration.

                                                                            -

                                                                            For the DLI data source, you can configure two DLI queues and databases to isolate the production environment from the development environment. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.

                                                                            +

                                                                            For the DLI data source, you can configure two DLI queues and databases to isolate the production environment from the development environment. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.

                                                                            Creating IAM users and assigning DataArts Studio permissions

                                                                            +

                                                                            Creating an IAM user and assigning DataArts Studio permissions to the user

                                                                            Create IAM accounts with the DARTS User permission for project members who use DataArts Studio.

                                                                            -

                                                                            For details, see "Creating an IAM User and Assigning DataArts Studio Permissions" in "Preparations".

                                                                            -

                                                                            Adding workspace members and assigning roles

                                                                            -

                                                                            Assign workspace roles to the IAM accounts of the project members. Six types of roles are available: admin, developer, deployer, operator, viewer, and custom role.

                                                                            -

                                                                            For details, see "Adding a Member and Assigning a Role" in "Preparations".

                                                                            +

                                                                            Create an IAM user with the DARTS User permissions for a project member who wants to use DataArts Studio and assign a workspace role to the created user.

                                                                            +

                                                                            For details, see Authorizing Users to Use DataArts Studio.

                                                                            Notification management

                                                                            Configure notifications to be sent when a job is abnormal or runs successfully.

                                                                            -

                                                                            For details, see Managing Notifications.

                                                                            +

                                                                            For details, see Notification Management.

                                                                            Backup management

                                                                            @@ -45,7 +45,7 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5105.html b/docs/dataartsstudio/umn/dataartsstudio_01_5105.html index a2336b2ea..d15b231e1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5105.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5105.html @@ -1,23 +1,23 @@ -

                                                                            Configuring Environment Isolation for a Workspace in Enterprise Mode

                                                                            +

                                                                            Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode

                                                                            • You can configure isolation between the development and production environments for DLI and DB.
                                                                            • After the environment isolation is configured, the data connection in the development environment in the script or job during data development is automatically switched to the data connection in the production environment after the process is released.

                                                                            Prerequisites

                                                                            • Before configuring environment isolation for DLI, ensure that you have created a DLI data connection.

                                                                            (Optional) Configuring DLI Environment Isolation

                                                                            Environment isolation needs to be configured only for a serverless service (that is, DLI).

                                                                            -
                                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                            2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                                            3. In the left navigation pane on the Management Center page, choose Data Source Resource Mapping Configuration.
                                                                              Figure 1 Data Source Resource Mapping Configuration
                                                                              +
                                                                              1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                              2. On the DataArts Studio console, locate a workspace and click Management Center.
                                                                              3. In the left navigation pane on the Management Center page, choose Data Source Resource Mapping Configuration.
                                                                                Figure 1 Data Source Resource Mapping Configuration

                                                                                -
                                                                              4. Click the DB Configuration tab and then Add. Set the database names for the development and production environments respectively and click Save. You can click and to edit and delete records.
                                                                                The database names must be the names of created databases. It is recommended that the database name for the development environment be the same as that for the production environment, and that suffix _dev be added to the database name for the development environment so that it can be distinguished from the database name for the production environment.
                                                                                Figure 2 DB Configuration
                                                                                +
                                                                              5. Click the DB Configuration tab and then Add. Set the database names for the development and production environments respectively and click Save. You can click and to edit and delete records.
                                                                                The database names must be the names of created databases. It is recommended that the database name for the development environment be the same as that for the production environment, and that suffix _dev be added to the database name for the development environment so that it can be distinguished from the database name for the production environment.
                                                                                Figure 2 DB Configuration

                                                                                -
                                                                              6. Click the DLI Queue Configuration tab and then Add. Set the queue names for the development and production environments respectively and click Save. You can use and to edit and delete records.
                                                                                The queue names must be the names of created DLI queues. It is recommended that the queue name for the development environment be the same as that for the production environment, and that suffix _dev be added to the queue name for the development environment so that it can be distinguished from the queue name for the production environment.
                                                                                Figure 3 DLI Queue Configuration
                                                                                +
                                                                              7. Click the DLI Queue Configuration tab and then Add. Set the queue names for the development and production environments respectively and click Save. You can use and to edit and delete records.
                                                                                The queue names must be the names of created DLI queues. It is recommended that the queue name for the development environment be the same as that for the production environment, and that suffix _dev be added to the queue name for the development environment so that it can be distinguished from the queue name for the production environment.
                                                                                Figure 3 DLI Queue Configuration

                                                                              8. After the preceding operations are complete, DLI environment isolation configuration is complete.
                                                                            -

                                                                            DB Configuration

                                                                            1. On the DataArts Studio console, locate a workspace and click Management Center.
                                                                            2. In the left navigation pane on the Management Center page, choose Data Source Resource Mapping Configuration.
                                                                            3. Click the DB Configuration tab and then Add. Set the database names for the development and production environments respectively and click Save. You can click and to edit and delete records.
                                                                              The database names must be the names of created databases. It is recommended that the database name for the development environment be the same as that for the production environment, and that suffix _dev be added to the database name for the development environment so that it can be distinguished from the database name for the production environment.

                                                                              For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments.

                                                                              +

                                                                              DB Configuration

                                                                              1. On the DataArts Studio console, locate a workspace and click Management Center.
                                                                              2. In the left navigation pane on the Management Center page, choose Data Source Resource Mapping Configuration.
                                                                              3. Click the DB Configuration tab and then Add. Set the database names for the development and production environments respectively and click Save. You can click and to edit and delete records.
                                                                                The database names must be the names of created databases. It is recommended that the database name for the development environment be the same as that for the production environment, and that suffix _dev be added to the database name for the development environment so that it can be distinguished from the database name for the production environment.

                                                                                For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection, you must configure database mapping on the Configure Data Source Resource Mapping page to isolate the development and production environments.

                                                                                -
                                                                                Figure 4 DB Configuration
                                                                                +
                                                                                Figure 4 DB Configuration

                                                                              @@ -29,3 +29,10 @@
                                                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5106.html b/docs/dataartsstudio/umn/dataartsstudio_01_5106.html new file mode 100644 index 000000000..f199780a9 --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5106.html @@ -0,0 +1,24 @@ + + +

                                                                              Operations Supported for Different Roles in Enterprise Mode

                                                                              +

                                                                              +
                                                                              + + diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_5135.html b/docs/dataartsstudio/umn/dataartsstudio_01_5135.html index 87b8fbb2b..314248424 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_5135.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_5135.html @@ -2,42 +2,42 @@

                                                                              Creating a Workspace in Enterprise Mode

                                                                              If you are using a workspace in simple mode and want to isolate the development and production environments, you can upgrade the workspace to one in enterprise mode. If you have not used any workspace in simple mode and do not need to inherit data, you can directly create a workspace in enterprise mode by following the instructions in this section.

                                                                              -

                                                                              Restrictions

                                                                              You can upgrade your workspace mode or create a workspace in enterprise mode only if you are assigned the DARTS Administrator or Tenant Administrator role.

                                                                              +

                                                                              Restrictions

                                                                              You can upgrade your workspace mode or create a workspace in enterprise mode only if you are assigned the DARTS Administrator or Tenant Administrator role.

                                                                              Prerequisites

                                                                              Before creating a workspace, ensure that:

                                                                              -
                                                                              • You have understood the differences between workspaces in simple mode and those in enterprise mode, such as the differences in the development process. For details, see Introduction to the Simple Mode and Enterprise Mode.
                                                                              • You have configured workspace-level scheduling identities, including public agencies and public IAM accounts. For details, see Configuring a Public Agency and Configuring a Public IAM Account.
                                                                              • You have prepared two sets of isolated data lake engines, one for the development environment and the other for the production environment.
                                                                                • Configure two sets of data lake services to isolate the development environment from the production environment.

                                                                                  For clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, DIS, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services that have the same version, specifications, components, region, VPC, subnet, and other related configurations. For details, see Creating a Data Connection.

                                                                                  +
                                                                                  • You have understood the differences between workspaces in simple mode and those in enterprise mode, such as the differences in the development process. For details, see Introduction to the Simple Mode and Enterprise Mode.
                                                                                  • You have configured workspace-level scheduling identities, including public agencies and public IAM accounts. For details, see Configuring a Public Agency and Configuring a Public IAM Account.
                                                                                  • You have prepared two sets of isolated data lake engines, one for the development environment and the other for the production environment.
                                                                                    • Configure two sets of data lake services to isolate the development environment from the production environment.

                                                                                      For clustered data sources, such as MRS, GaussDB(DWS), RDS, MySQL, Oracle, and ECS, you can create data connections in Management Center to distinguish data lake services in the development environment from those in the production environment. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of data lake services that have the same version, specifications, components, region, VPC, subnet, and other related configurations. For details, see Creating a DataArts Studio Data Connection.

                                                                                      When creating a data connection, you can select different clusters for the development environment and production environment to isolate them.

                                                                                      -
                                                                                      Figure 1 Selecting different clusters during data connection creation
                                                                                      +
                                                                                      Figure 1 Selecting different clusters during data connection creation

                                                                                    • Configure environment isolation for DLI.

                                                                                      Configure environment isolation in enterprise mode, including DLI queue configuration and DB configuration.

                                                                                      -

                                                                                      For serverless services (such as DLI), you can configure the mapping between data lake services in the production environment and those in the development environment through environment isolation in Management Center. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.

                                                                                      +

                                                                                      For serverless services (such as DLI), you can configure the mapping between data lake services in the production environment and those in the development environment through environment isolation in Management Center. The data lake is automatically switched during development and production. Therefore, you need to prepare two sets of queues and database resources in the serverless data lake service and distinguish them by name suffix. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.

                                                                                    • Configure two databases in the same data lake service to isolate the development environment from the production environment.

                                                                                      For GaussDB(DWS), MRS Hive, and MRS Spark, if you select the same cluster when creating a data connection (as shown in Figure 2), you must configure database mapping on the Configure Data Source Resource Mapping page shown in Figure 3 to isolate the development and production environments. For details, see DB configuration.

                                                                                      -
                                                                                      Figure 2 Selecting the same cluster during data connection creation
                                                                                      +
                                                                                      Figure 2 Selecting the same cluster during data connection creation

                                                                                      -
                                                                                      Figure 3 DB Configuration
                                                                                      +
                                                                                      Figure 3 DB Configuration

                                                                                    -
                                                                                  • Prepare and synchronize data.
                                                                                    • After creating data lake services, you must create databases, database schemas (required only for DWS), and data tables in the data lake services of the development and production environments based on the project plan (for example, the databases and tables required for data development).
                                                                                      • For clustered data sources (such as MRS, DWS, RDS, MySQL, Oracle, DIS and ECS), use two clusters, one for the development environment and the other for the production environment. The names of the databases, database schemas (required only for DWS), and data tables in the two environments must be the same.
                                                                                      • For serverless services (such as DLI), you are advised to associate and distinguish the two queues and databases by name suffix (add suffix _dev to the names of the queues and databases in the development environment and add no suffix to those in the production environment). The names of data tables in the development environment must be the same as those in the production environment.
                                                                                      • For DWS, MRS Hive, and MRS Spark data sources, if the same cluster is used for the development and production environments, use two databases to isolate the development and production environments (add suffix _dev to the database for the development environment and add no suffix to the database for the production environment). The names of database schemas (required only for DWS) and data tables in the development environment must be the same as those in the production environment.
                                                                                      +
                                                                                    • Prepare and synchronize data.
                                                                                      • After creating data lake services, you must create databases, database schemas (required only for DWS), and data tables in the data lake services of the development and production environments based on the project plan (for example, the databases and tables required for data development).
                                                                                        • For clustered data sources (such as MRS, DWS, RDS, MySQL, Oracle, and ECS), use two clusters, one for the development environment and the other for the production environment. The names of the databases, database schemas (required only for DWS), and data tables in the two environments must be the same.
                                                                                        • For serverless services (such as DLI), you are advised to associate and distinguish the two queues and databases by name suffix (add suffix _dev to the names of the queues and databases in the development environment and add no suffix to those in the production environment). The names of data tables in the development environment must be the same as those in the production environment.
                                                                                        • For DWS, MRS Hive, and MRS Spark data sources, if the same cluster is used for the development and production environments, use two databases to isolate the development and production environments (add suffix _dev to the database for the development environment and add no suffix to the database for the production environment). The names of database schemas (required only for DWS) and data tables in the development environment must be the same as those in the production environment.
                                                                                      • After creating databases, database schemas (required only for DWS), and data tables, you must synchronize data of existing tables (if any) between the two data lake services.
                                                                                        • Existing data in data lakes: Use data migration services such as CDM and DRS to synchronize data in batches between data lakes.
                                                                                        • Data to be migrated from the data source: Use peering jobs of data migration services such as CDM and DRS to synchronize data between the data lake service of the production environment and that of the development environment.

                                                                              Change Description

                                                                              After the workspace mode is upgraded, a development environment isolated from the production environment is added.

                                                                              -

                                                                              Upgrading the Simple Mode to Enterprise Mode

                                                                              With the DARTS Administrator or Tenant Administrator role, you can upgrade a workspace in simple mode to one in enterprise mode.

                                                                              +

                                                                              Upgrading the Simple Mode to Enterprise Mode

                                                                              With the DARTS Administrator or Tenant Administrator role, you can upgrade a workspace in simple mode to one in enterprise mode.

                                                                              • Pre-upgrade operations

                                                                                Configure a workspace-level public agency or public IAM account in DataArts Factory to avoid an upgrade failure.

                                                                                For details about how to configure an agency, see Configuring a Scheduling Identity.

                                                                                -
                                                                                Figure 4 Configuring a workspace-level agency
                                                                                +
                                                                                Figure 4 Configuring a workspace-level agency

                                                                                -
                                                                              • Upgrade operations
                                                                                1. Log in to the DataArts Studio console.
                                                                                2. Locate a DataArts Studio instance and click Access. Then, click the Workspaces tab.
                                                                                3. Locate the workspace you want to upgrade and click Edit in Operation column.
                                                                                4. In the displayed Workspace Information dialog box, click Upgrade next to the Mode text box. In the displayed dialog box, click Upgrade.
                                                                                  Figure 5 Upgrading to the enterprise mode
                                                                                  +
                                                                                5. Upgrade operations
                                                                                  1. Log in to the DataArts Studio console.
                                                                                  2. Locate a DataArts Studio instance and click Access. Then, click the Workspaces tab.
                                                                                  3. Locate the workspace you want to upgrade and click Edit in Operation column.
                                                                                  4. In the displayed Workspace Information dialog box, click Upgrade next to the Mode text box. In the displayed dialog box, click Upgrade.
                                                                                    Figure 5 Upgrading to the enterprise mode

                                                                                6. Post-upgrade operations

                                                                                  After the upgrade is complete, you (as the admin) need to modify data connections, configure environment isolation, and define roles such as the admin, developer, deployer, and operator in the workspace.

                                                                                  -
                                                                                  1. Modify data connections. For details, see Creating a Data Connection.
                                                                                  2. Configure environment isolation. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                                                  3. Define workspace roles for other users: For details, see "Adding a Member and Assigning a Role" in "Preparations".
                                                                                  +
                                                                                  1. Modify data connections. For details, see Creating a DataArts Studio Data Connection.
                                                                                  2. Configure environment isolation. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                                                  3. Define workspace roles for other users. For details, see Adding Workspace Members and Assigning Roles.

                                                                              Creating a Workspace in Enterprise Mode

                                                                              If you have not used the simple mode before and do not need to inherit business data, you can directly create a workspace in enterprise mode.

                                                                              -
                                                                              • Create a workspace.
                                                                                1. Log in to the DataArts Studio console using an account with the DARTS Administrator or Tenant Administrator permission.
                                                                                2. Locate an instance and click Access. Then click the Workspaces tab.
                                                                                3. Click Create. In the displayed Create dialog box, set parameters based on Table 1 and click OK.

                                                                                  +
                                                                                  • Create a workspace.
                                                                                    1. Log in to the DataArts Studio console using an account with the DARTS Administrator or Tenant Administrator permission.
                                                                                    2. Locate an instance and click Access. Then click the Workspaces tab.
                                                                                    3. Click Create. In the displayed Create dialog box, set parameters based on Table 1 and click OK.

                                                                                      @@ -62,15 +62,19 @@ -
                                                                                      Table 1 Parameters for creating a workspace

                                                                                      Parameter

                                                                                      Enterprise Project

                                                                                      Enterprise project associated with the default workspace of the DataArts Studio instance.

                                                                                      -
                                                                                      This parameter is available only when an enterprise project has been created. If you want to connect the DataArts Studio instance to a cloud service (such as DWS, MRS, and RDS), ensure that the enterprise project of the DataArts Studio workspace is the same as that of the cloud service instance.
                                                                                      • You can create only one DataArts Studio instance for an enterprise project.
                                                                                      • If you want to enable communication between DataArts Studio and another cloud service, ensure that the enterprise project of DataArts Studio is the same as that of the cloud service.
                                                                                      +

                                                                                      Enterprise project associated with the default workspace of the DataArts Studio instance.

                                                                                      +
                                                                                      This parameter is available only when an enterprise project has been created. If you want to connect the DataArts Studio instance to an instance of another cloud service, such as GaussDB(DWS), MRS, and RDS, ensure that the enterprise project of the DataArts Studio instance's workspace is the same as that of the target cloud service instance.
                                                                                      • You can create only one DataArts Studio instance for an enterprise project.
                                                                                      • If you want to enable communication between DataArts Studio and another cloud service, ensure that the enterprise project of DataArts Studio is the same as that of the target cloud service.
                                                                                      +
                                                                                      NOTE:

                                                                                      If the enterprise project function is not enabled, only one DataArts Studio instance can be created for each IAM project.

                                                                                      +

                                                                                      Job Log Path

                                                                                      OBS bucket for storing the job logs of DataArts Factory of DataArts Studio. To use the DataArts Factory module of DataArts Studio, workspace members must have the read and write permissions on the OBS bucket for storing job logs. Otherwise, the system cannot read or write job logs of DataArts Factory.

                                                                                      -
                                                                                      • Click Select. You can select an existing OBS bucket. The selected OBS bucket is globally configured in the current workspace.
                                                                                      • If you do not set this parameter, job logs of DataArts Factory are stored in the OBS bucket named dlf-log-{projectId} by default.
                                                                                      +
                                                                                      • Click Select. You can select an existing OBS bucket. The selected OBS bucket is globally configured in the current workspace.
                                                                                      • If you do not set this parameter, job logs of DataArts Factory are stored in the OBS bucket named dlf-log-{projectId} by default.
                                                                                        NOTE:

                                                                                        The execution logs of data development jobs are stored in xxxxx.log format in an OBS bucket. xxxxx indicates the job ID. Deleting the historical records of SQL statements that have been executed does not affect services.

                                                                                        +
                                                                                        +

                                                                                      Dirty Data Path

                                                                                      @@ -84,7 +88,7 @@
                                                                                    4. Perform follow-up operations.

                                                                                      After creating the workspace, you (as the admin) need to create data connections, configure environment isolation, and define roles such as the admin, developer, deployer, and operator in the workspace.

                                                                                      -
                                                                                      1. Create data connections. For details, see Creating a Data Connection.
                                                                                      2. Configure environment isolation. For details, see Configuring Environment Isolation for a Workspace in Enterprise Mode.
                                                                                      3. Define workspace roles for other users: For details, see "Adding a Member and Assigning a Role" in "Preparations".
                                                                                      4. Configure a workspace-level public agency or public IAM account in DataArts Factory. For details about how to configure an agency, see Configuring a Scheduling Identity.
                                                                                        Figure 6 Configuring a workspace-level agency
                                                                                        +
                                                                                        1. Create data connections. For details, see Creating a DataArts Studio Data Connection.
                                                                                        2. Configure environment isolation. For details, see Configuring Environment Isolation for a DataArts Studio Workspace in Enterprise Mode.
                                                                                        3. Define workspace roles for other users. For details, see Adding Workspace Members and Assigning Roles.
                                                                                        4. Configure a workspace-level public agency or public IAM account in DataArts Factory. For details about how to configure an agency, see Configuring a Scheduling Identity.
                                                                                          Figure 6 Configuring a workspace-level agency

                                                                                      5. @@ -92,7 +96,14 @@ + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_7523.html b/docs/dataartsstudio/umn/dataartsstudio_01_7523.html index 20455a556..799f93dad 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_7523.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_7523.html @@ -30,21 +30,22 @@

                                                                                        Method 1

                                                                                        In DataArts Studio, create a job that is scheduled every day and add an empty Dummy node (which does not process data) to the job. You can set a condition expression on the connection line between the Dummy node and its subsequent node to check whether the current day is the last day of the current month. If it is the last day, the subsequent nodes are executed. Otherwise, the subsequent nodes are skipped.

                                                                                        -
                                                                                        1. In the left navigation pane of the DataArts Factory console, choose Data Development > Develop Job.
                                                                                        2. Set Scheduling Frequency to Every day.
                                                                                          Figure 1 Setting Scheduling Frequency to Every day
                                                                                          +
                                                                                          1. In the left navigation pane of the DataArts Factory console, choose Data Development > Develop Job.
                                                                                          2. Set Scheduling Frequency to Every day.
                                                                                            Figure 1 Setting Scheduling Frequency to Every day

                                                                                            -
                                                                                          3. Right-click the connection line between the Dummy node and its subsequent node and select Set Condition to configure a condition expression that is used to determine whether to execute the subsequent node.
                                                                                            Figure 2 Configuring a condition expression
                                                                                            +
                                                                                          4. Right-click the connection line between the Dummy node and its subsequent node and select Set Condition to configure a condition expression that is used to determine whether to execute the subsequent node.
                                                                                            Figure 2 Configuring a condition expression

                                                                                          5. Configure the expression as follows:
                                                                                            #{DateUtil.getDay(DateUtil.addDays(Job.planTime,1)) == 1 ? "true" : "false"}

                                                                                            The expression is used to obtain the current time and check whether the next day is 1st of a month. If yes, the current day is the last day of the current month, and the subsequent node will be executed; if no, the subsequent node will be skipped.

                                                                                            -
                                                                                            Figure 3 Condition expression
                                                                                            +
                                                                                            Figure 3 Condition expression

                                                                                            -

                                                                                            For example, if you want a job to be executed on the last day and seventh day of each month, perform the following operation:

                                                                                            +

                                                                                            For example, if you want a job to be executed on the last day of each month, perform the above operations.

                                                                                            +

                                                                                            For example, if you want a job to be executed on the seventh day of each month, perform the following operations:

                                                                                            Configure the following expression to check whether the current day is 7th:

                                                                                            #{DateUtil.getDay(Job.planTime) == 7 ? "true" : "false"}
                                                                                        -

                                                                                        Method 2

                                                                                        1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                                        2. Click Scheduling Setup on the right of the job canvas.
                                                                                        3. Set Scheduling Type to Run periodically, Scheduling Frequency to Every month, and Select Time to the last day of each month.
                                                                                          Figure 4 Setting the scheduling time to the last day of each month
                                                                                          +

                                                                                          Method 2

                                                                                          1. In the left navigation pane of DataArts Factory, choose Development > Develop Job.
                                                                                          2. Click Scheduling Setup on the right of the job canvas.
                                                                                          3. Set Scheduling Type to Run periodically, Scheduling Frequency to Every month, and Select Time to the last day of each month.
                                                                                            Figure 4 Setting the scheduling time to the last day of each month

                                                                                            After the scheduling time is configured, the job will be automatically executed on the last day of each month.

                                                                                          @@ -56,3 +57,10 @@
                                                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_7524.html b/docs/dataartsstudio/umn/dataartsstudio_01_7524.html index 8c31a7024..9aa4fb086 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_7524.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_7524.html @@ -2,64 +2,50 @@

                                                                                        Referencing Parameters in Scripts and Jobs

                                                                                        This section describes how to reference parameters in scripts and jobs, application scope of the referenced parameters, and whether EL expressions and simple variable sets are supported, helping you better understand how to use workspace-level, script-level, and job-level parameters.

                                                                                        -

                                                                                        Parameters can be set in environment variables, job parameters, and script parameters, but their application scopes are different. If there is a conflict when parameters in environment variables, job parameters, and script parameters of the same name, the calling priority is: job parameters > environment variables > script parameters.

                                                                                        +

                                                                                        The application scopes of workspace environment variables, job parameters, and script parameters are different. If a workspace environment variable, a job parameter, and a script parameter have the same name, their priorities are as follows: job parameter > workspace environment variable > script parameter.

                                                                                        -
                                                                                        Table 1 Methods of using parameters

                                                                                        Type

                                                                                        +
                                                                                        - - - - - - - - - - - - - - - - - - -
                                                                                        Table 1 Methods of using parameters

                                                                                        Type

                                                                                        Scenario

                                                                                        +

                                                                                        Scenario

                                                                                        Scope

                                                                                        +

                                                                                        Scope

                                                                                        Calling Method

                                                                                        -

                                                                                        Example

                                                                                        +

                                                                                        Calling Method

                                                                                        Environment variables/constants

                                                                                        +

                                                                                        Environment variables/constants

                                                                                        When configuring job parameters, you can extract a parameter that belongs to multiple jobs as an environment variable.

                                                                                        +

                                                                                        When configuring job parameters, you can extract a parameter that belongs to multiple jobs as an environment variable.

                                                                                        Current workspace

                                                                                        +

                                                                                        Current workspace

                                                                                        ${Environment variable}

                                                                                        +

                                                                                        ${Environment variable}

                                                                                        ${Environment constant}

                                                                                        For details about the configuration method, see Environment Variable.

                                                                                        EL expression: #{DateUtil.getDay(Job.planTime)}

                                                                                        -

                                                                                        Simple variable set: ${yyyymmdd±N}

                                                                                        -

                                                                                        Job variables/constants

                                                                                        +

                                                                                        Job variables/constants

                                                                                        Job parameters can be used in any node in jobs.

                                                                                        +

                                                                                        Job parameters can be used in any node in jobs.

                                                                                        Current job

                                                                                        +

                                                                                        Current job

                                                                                        ${Job variable}

                                                                                        +

                                                                                        ${Job variable}

                                                                                        ${Job constant}

                                                                                        For details about the configuration method, see Configuring Job Parameters.

                                                                                        EL expression: #{DateUtil.now()}

                                                                                        -

                                                                                        Simple variable set: ${yyyymm±N}

                                                                                        -

                                                                                        Script parameters

                                                                                        +

                                                                                        Script parameters

                                                                                        Set the name and value of a custom field.

                                                                                        +

                                                                                        Set the name and value of a custom field.

                                                                                        Current script

                                                                                        +

                                                                                        Current script

                                                                                        ${Script parameter}

                                                                                        +

                                                                                        ${Script parameter}

                                                                                        For details about the configuration method, see Script Parameter.

                                                                                        Example script parameters:

                                                                                        -

                                                                                        ${time}

                                                                                        -

                                                                                        ${yyyymmddhh24miss}

                                                                                        -

                                                                                        ${job_id}

                                                                                        -

                                                                                        ${instance_id}

                                                                                        -
                                                                                        @@ -68,36 +54,36 @@

                                                                                        The default variable format is ${}.

                                                                                        Environment Variable

                                                                                        Variables and constants can be defined in environment variables. Environment variables take effect in current workspace.
                                                                                        • The value of a variable (such as workspace name) varies depending on the workspace. When exporting a variable from a workspace and import it to another workspace, you must reconfigure its value.
                                                                                        • The value of a constant in different workspaces is the same. When importing a constant to another workspace, you do not need to reconfigure its value.
                                                                                        -
                                                                                        Figure 1 Environment Variable
                                                                                        +
                                                                                        Figure 1 Environment Variable

                                                                                        The specific application is as follows:

                                                                                        -

                                                                                        An environment variable has been added. The parameter name is sdqw and the parameter value is wqewqewqe.

                                                                                        -
                                                                                        1. Open a created job and drag a Create OBS node from the node library to the canvas.
                                                                                        2. On the Node Properties tab page, configure the node properties.

                                                                                          Figure 2 Create OBS
                                                                                          +

                                                                                          An environment variable has been added. The parameter name is sdqw and the parameter value is wqewqewqe.

                                                                                          +
                                                                                          1. Open a created job and drag a Create OBS node from the node library to the canvas.
                                                                                          2. On the Node Properties tab page, configure the node properties.

                                                                                            Figure 2 Create OBS

                                                                                          3. Click Save and then Monitor to monitor the running status of the job.
                                                                                        -

                                                                                        Configuring Job Parameters

                                                                                        Parameters and constants can be defined in job parameters. Job parameters take effect in current job.
                                                                                        • The value of a parameter varies depending on the job. You need to reconfigure the parameter.
                                                                                        • The value of a constant in different jobs is the same. When importing a constant to another job, you do not need to reconfigure its value.
                                                                                          Figure 3 Job parameter.
                                                                                          +

                                                                                          Configuring Job Parameters

                                                                                          Variables and constants can be defined in job parameters. Job parameters take effect in the current job.
                                                                                          • The value of a variable varies depending on the job. You need to configure a value for the variable in each job.
                                                                                          • The value of a constant in different jobs is the same. When importing a constant to another job, you do not need to reconfigure its value.
                                                                                            Figure 3 Job parameter.

                                                                                            After a job parameter is defined, it can be referenced by a job node.

                                                                                            -
                                                                                            Figure 4 Using a Job Parameter Configuration
                                                                                            +
                                                                                            Figure 4 Using a Job Parameter Configuration

                                                                                          -

                                                                                          Script Parameter

                                                                                          • Script parameters take effect in current script and it can be used in the following ways.
                                                                                            • For SQL scripts, you can directly enter parameters in the script editor (not supported for Flink SQL scripts). During job scheduling, you can assign values to parameters through node attributes, as shown in 2.
                                                                                            • For Shell scripts, you can enter a parameter and an interactive parameter in the upper part of the editor to transfer the parameters.
                                                                                            • Python scripts support parameter transfer.
                                                                                            • For SQL scripts, you can directly enter parameters in the script editor (not supported for Flink SQL scripts). When executing a script independently, you can configure parameters in the lower part of the editor shown in Figure 5.
                                                                                              Figure 5 Configuring script parameters when executing a script independently
                                                                                              +

                                                                                              Script Parameter

                                                                                              • Script parameters take effect in current script and it can be used in the following ways.
                                                                                                • For SQL scripts, you can directly enter parameters in the script editor (not supported for Flink SQL scripts). During job scheduling, you can assign values to parameters through node attributes, as shown in 2.
                                                                                                • For Shell scripts, you can enter a parameter and an interactive parameter in the upper part of the editor to transfer the parameters.
                                                                                                • Python scripts support parameter transfer.
                                                                                                • For SQL scripts, you can directly enter parameters in the script editor (not supported for Flink SQL scripts). When executing a script independently, you can configure parameters in the lower part of the editor shown in Figure 5.
                                                                                                  Figure 5 Configuring script parameters when executing a script independently

                                                                                              1. Developing a Python Script During script development, the script expression must contain variables. For example, if the variable in the SQL statement is DATE, set this parameter to ${DATE} in the script. In the job parameter configuration, you can compile the statement expression of the script parameter Date in 2.
                                                                                                On the script development page, enter development statements in the editor, as shown in the following figure.
                                                                                                INSERT INTO B FROM (SELECT * FROM A WHERE DATE = ${DATE})
                                                                                                -
                                                                                                Figure 6 Developing a script
                                                                                                +
                                                                                                Figure 6 Developing a script

                                                                                                After the dws_030903 script is compiled, save and submit the latest version of the script.

                                                                                              2. Develop batch jobs. When developing a job, you need to configure node attribute parameters.

                                                                                                In the left navigation pane of DataArts Factory, choose Data Development > Develop Job.

                                                                                                -
                                                                                                Figure 7 Configuring script parameters when the script is executed by job scheduling
                                                                                                +
                                                                                                Figure 7 Configuring script parameters when the script is executed by job scheduling

                                                                                                -
                                                                                                • If the associated SQL script uses a parameter, the parameter name is displayed (DATA for example). Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.
                                                                                                • If the associated SQL script or script parameters change, you can click to synchronize the changes or click to edit the changes.
                                                                                                • All nodes involving scripts, such as SQL scripts, shell scripts, and Python scripts, can use this method to reference script variables.
                                                                                                +
                                                                                                • If the associated SQL script uses a parameter, the parameter name is displayed (DATA for example). Set the parameter value in the text box next to the parameter name. The parameter value can be an EL expression.
                                                                                                • If the associated SQL script or script parameters change, you can click to synchronize the changes or click to edit the changes.
                                                                                                • All nodes involving scripts, such as SQL scripts, shell scripts, and Python scripts, can use this method to reference script variables.
                                                                                              @@ -110,3 +96,10 @@
                                                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_7564.html b/docs/dataartsstudio/umn/dataartsstudio_01_7564.html index 605e39478..693a9620a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_01_7564.html +++ b/docs/dataartsstudio/umn/dataartsstudio_01_7564.html @@ -4,14 +4,14 @@

                                                                                        Scenario

                                                                                        This section describes how to configure a job that is scheduled at a specified time of a year.

                                                                                        Procedure

                                                                                        In DataArts Studio, create a job that is scheduled every month and add an empty Dummy node (which does not process data) to the job. You can set a condition expression on the connection line between the Dummy node and its subsequent node to check whether the current time falls in the specified day (for example, June 29, 2023) for scheduling the job. If yes, the subsequent node is executed. Otherwise, the subsequent node is skipped.

                                                                                        -
                                                                                        1. In the left navigation pane of the DataArts Factory console, choose Data Development > Develop Job.
                                                                                        2. Set Scheduling Frequency to Every month.
                                                                                          Figure 1 Setting Scheduling Frequency to Every month
                                                                                          +
                                                                                          1. In the left navigation pane of the DataArts Factory console, choose Data Development > Develop Job.
                                                                                          2. Set Scheduling Frequency to Every month.
                                                                                            Figure 1 Setting Scheduling Frequency to Every month

                                                                                            -
                                                                                          3. Right-click the connection line between the Dummy node and its subsequent node and select Set Condition to configure a condition expression that is used to determine whether to execute the subsequent node.
                                                                                            Figure 2 Configuring a condition expression
                                                                                            +
                                                                                          4. Right-click the connection line between the Dummy node and its subsequent node and select Set Condition to configure a condition expression that is used to determine whether to execute the subsequent node.
                                                                                            Figure 2 Configuring a condition expression

                                                                                          5. Configure the expression as follows:
                                                                                            #{DateUtil.getMonth(Job.planTime) == 6 ? "true" : "false"}

                                                                                            The expression is used to obtain the current time and check whether it falls in June. If yes, the subsequent node will be executed; if no, the subsequent node will be skipped.

                                                                                            -
                                                                                            Figure 3 Condition expression
                                                                                            +
                                                                                            Figure 3 Condition expression

                                                                                        @@ -22,3 +22,10 @@
                                                                                        + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_01_7587.html b/docs/dataartsstudio/umn/dataartsstudio_01_7587.html new file mode 100644 index 000000000..d2ce93dde --- /dev/null +++ b/docs/dataartsstudio/umn/dataartsstudio_01_7587.html @@ -0,0 +1,26 @@ + + +

                                                                                        Associating a Real-Time Migration Resource Group with Workspaces

                                                                                        +

                                                                                        Before creating a real-time data migration job, you need to associate the data migration resource group with a DataArts Studio workspace so that you can select a specified computing resource group when creating a real-time data migration job.

                                                                                        +

                                                                                        Prerequisites

                                                                                        You have purchased a resource group. For details, see Buying a DataArts Migration Resource Group Incremental Package.

                                                                                        +
                                                                                        +

                                                                                        Procedure

                                                                                        1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                                        2. Locate an instance and click Access.
                                                                                        3. Click the Resources tab.
                                                                                        4. On the Real-Time Resources page, locate a data migration resource group and click Change Workspace in the Operation column.

                                                                                          Figure 1 Associating a resource group with workspaces
                                                                                          +

                                                                                        5. In the displayed dialog box, search for the DataArts Studio workspace you want to use and click Bind. Then the data migration resource group can be selected in the workspace.

                                                                                          A data migration resource group can be associated with multiple DataArts Studio workspaces.

                                                                                          +
                                                                                          +
                                                                                          Figure 2 Associating a resource group with workspaces
                                                                                          +

                                                                                        +
                                                                                        +
                                                                                        + + + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_03_0001.html b/docs/dataartsstudio/umn/dataartsstudio_03_0001.html index a76e26402..5ee51a500 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_03_0001.html +++ b/docs/dataartsstudio/umn/dataartsstudio_03_0001.html @@ -5,12 +5,12 @@
                                                                                        -
                                                                                        Figure 1 Setting Maximum Concurrent Extractors for a CDM cluster
                                                                                        +
                                                                                        Figure 1 Setting Maximum Concurrent Extractors for a CDM cluster
                                                                                      6. Configure the number of concurrent extractors based on the following rules:
                                                                                        1. When data is to be migrated to files, CDM does not support multiple concurrent tasks. In this case, set a single process to extract data.
                                                                                        2. If each row of the table contains less than or equal to 1 MB data, data can be extracted concurrently. If each row contains more than 1 MB data, it is recommended that data be extracted in a single thread.
                                                                                        3. Set Concurrent Extractors for a job based on Maximum Concurrent Extractors for the cluster. It is recommended that Concurrent Extractors is less than Maximum Concurrent Extractors.
                                                                                        4. If the destination is DLI, you are advised to set the number of concurrent extractors to 1. Otherwise, data may fail to be written.
                                                                                        -
                                                                                        Figure 2 Setting Concurrent Extractors for a job
                                                                                        +
                                                                                        Figure 2 Setting Concurrent Extractors for a job
                                                                                      + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_03_0126.html b/docs/dataartsstudio/umn/dataartsstudio_03_0126.html index 3db2a5384..648e3eeb8 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_03_0126.html +++ b/docs/dataartsstudio/umn/dataartsstudio_03_0126.html @@ -1,7 +1,10 @@

                                                                                      Does DataArts Studio Support Custom Python Scripts?

                                                                                      -

                                                                                      Yes.

                                                                                      +

                                                                                      Symptom

                                                                                      Whether DataArts Studio supports custom Python scripts

                                                                                      +
                                                                                      +

                                                                                      Solution

                                                                                      Yes.

                                                                                      +
                                                                                    5. -
                                                                                      Figure 1 Setting Maximum Concurrent Extractors for a CDM cluster
                                                                                      +
                                                                                      Figure 1 Setting Maximum Concurrent Extractors for a CDM cluster
                                                                                    6. Configure the number of concurrent extractors based on the following rules:
                                                                                      1. When data is to be migrated to files, CDM does not support multiple concurrent tasks. In this case, set a single process to extract data.
                                                                                      2. If each row of the table contains less than or equal to 1 MB data, data can be extracted concurrently. If each row contains more than 1 MB data, it is recommended that data be extracted in a single thread.
                                                                                      3. Set Concurrent Extractors for a job based on Maximum Concurrent Extractors for the cluster. It is recommended that Concurrent Extractors is less than Maximum Concurrent Extractors.
                                                                                      4. If the destination is DLI, you are advised to set the number of concurrent extractors to 1. Otherwise, data may fail to be written.
                                                                                      -
                                                                                      Figure 2 Setting Concurrent Extractors for a job
                                                                                      +
                                                                                      Figure 2 Setting Concurrent Extractors for a job
                                                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_03_0337.html b/docs/dataartsstudio/umn/dataartsstudio_03_0337.html index 81a73b888..6ee18e05e 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_03_0337.html +++ b/docs/dataartsstudio/umn/dataartsstudio_03_0337.html @@ -1,11 +1,15 @@

                                                                              Does CDM Support Real-Time Migration of Dynamic Data?

                                                                              -

                                                                              No. If data is written to the source during the migration, an error may occur.

                                                                              +

                                                                              Symptom

                                                                              Does CDM support real-time migration of dynamic data?

                                                                              +
                                                                              +

                                                                              Solution

                                                                              No.

                                                                              +

                                                                              If data is written to the source during the migration, an error may occur.

                                                                              +
                                                                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_03_0340.html b/docs/dataartsstudio/umn/dataartsstudio_03_0340.html index 4f1e83b23..a98aa2ea5 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_03_0340.html +++ b/docs/dataartsstudio/umn/dataartsstudio_03_0340.html @@ -1,11 +1,14 @@

                                                                              How Do I Obtain the Current Time Using an Expression?

                                                                              -

                                                                              You can use the DateUtils.format(${timestamp()},"yyyy-MM-dd HH:mm:ss") expression on the Map Field page to obtain the current time.

                                                                              +

                                                                              Symptom

                                                                              How do I obtain the current time using an expression?

                                                                              +
                                                                              +

                                                                              Solution

                                                                              You can use the DateUtils.format(${timestamp()},"yyyy-MM-dd HH:mm:ss") expression on the Map Field page to obtain the current time.

                                                                              +
                                                                              diff --git a/docs/dataartsstudio/umn/dataartsstudio_03_0341.html b/docs/dataartsstudio/umn/dataartsstudio_03_0341.html index 795e790c9..417ceef63 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_03_0341.html +++ b/docs/dataartsstudio/umn/dataartsstudio_03_0341.html @@ -6,13 +6,20 @@

                                                                              Possible Cause

                                                                              By default, tinyInt1isBit is set to true for MySQL databases. As a result, TINYINT(1) is processed as BIT (that is, Types.BOOLEAN), and 1 or 0 is read as true or false.

                                                                              Solution

                                                                              In the advanced attributes of the MySQL link, add either of the following parameters so that tables can be properly created at the destination:

                                                                              -
                                                                              • Parameter tinyInt1isBit, with its value set to false
                                                                              • Parameter mysql.bool.type.transform, with its value set to false
                                                                                Figure 1 Adding link attributes
                                                                                +
                                                                                • Parameter tinyInt1isBit, with its value set to false
                                                                                • Parameter mysql.bool.type.transform, with its value set to false
                                                                                  Figure 1 Adding link attributes
                                                                              + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_03_0400.html b/docs/dataartsstudio/umn/dataartsstudio_03_0400.html index f6ea9cf86..53a2953f9 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_03_0400.html +++ b/docs/dataartsstudio/umn/dataartsstudio_03_0400.html @@ -1,7 +1,10 @@

                                                                              Why Does the Execution of an RDS SQL Statement Fail and an Error Is Reported Indicating That hll Does Not Exist?

                                                                              -

                                                                              By default, the hll plug-in is created in the public schema. The SQL statement must contain the schema to which the hll belongs.

                                                                              +

                                                                              Symptom

                                                                              An RDS SQL statement fails to be executed and an error is reported indicating that hll does not exist.

                                                                              +
                                                                              +

                                                                              Solution

                                                                              By default, the hll plug-in is created in the public schema. The SQL statement must contain the schema to which the hll belongs.

                                                                              +

                                                                            Google Chrome

                                                                            115, 114, and 113

                                                                            +

                                                                            133, 132, or 131

                                                                            Windows 10

                                                                            The resolution ranges from 1366x768 px to 1920x1080 px. 1920x1080 px is the optimal resolution for the best display of the console.

                                                                            +

                                                                            1920x1080 and 2560x1440 are recommended.

                                                                            +

                                                                            Firefox

                                                                            +

                                                                            135 or 134

                                                                            +

                                                                            Windows 10

                                                                            +

                                                                            1920x1080 and 2560x1440 are recommended.

                                                                            +

                                                                            Microsoft Edge

                                                                            +

                                                                            N/A (The version is updated with W10.)

                                                                            +

                                                                            Windows 10

                                                                            +

                                                                            1920x1080 and 2560x1440 are recommended.

                                                                            Table 2 Restrictions for using DataArts Studio

                                                                            Component

                                                                            +
                                                                            @@ -35,12 +53,12 @@ - - @@ -53,31 +71,26 @@ - - - - - - diff --git a/docs/dataartsstudio/umn/dataartsstudio_07_007.html b/docs/dataartsstudio/umn/dataartsstudio_07_007.html index 323e7ddd5..bda9bd97c 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_07_007.html +++ b/docs/dataartsstudio/umn/dataartsstudio_07_007.html @@ -5,9 +5,9 @@

                                                                            CTS

                                                                            DataArts Studio uses Cloud Trace Service (CTS) to audit users' non-query operations on the management console to ensure that no invalid or unauthorized operations have been performed. CTS enhances security.

                                                                            -

                                                                            ECS

                                                                            CDM clusters of DataArts Studio consist of Elastic Cloud Servers (ECSs). In addition, DataArts Studio can use host connections to connect to ECSs and run Shell or Python scripts.

                                                                            +

                                                                            ECS

                                                                            CDM clusters of DataArts Studio consist of Elastic Cloud Servers (ECSs). In addition, DataArts Studio can use host connections to connect to ECSs and run Shell or Python scripts.

                                                                            -

                                                                            VPC

                                                                            Virtual Private Cloud (VPC) provides isolated network environments for DataArts Studio.

                                                                            +

                                                                            VPC

                                                                            Virtual Private Cloud (VPC) provides isolated network environments for DataArts Studio.

                                                                            EIP

                                                                            Elastic IP (EIP) enables DataArts Studio to communicate with the Internet.

                                                                            diff --git a/docs/dataartsstudio/umn/dataartsstudio_07_012.html b/docs/dataartsstudio/umn/dataartsstudio_07_012.html index e239e7143..8762b4aa1 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_07_012.html +++ b/docs/dataartsstudio/umn/dataartsstudio_07_012.html @@ -1,40 +1,40 @@

                                                                            Permission Management

                                                                            -

                                                                            If you need to assign different permissions to employees in your enterprise to access your DataArts Studio resources, IAM is a good choice for fine-grained permissions management. IAM provides identity authentication, permissions management, and access control, helping you secure access to your cloud resources.

                                                                            -

                                                                            With IAM, you can use your cloud account to create IAM users for your employees, and assign permissions to the users to control their access to specific resource types. For example, if you want to allow some software developers in your enterprise to use DataArts Studio resources but disallow them to delete workspaces or perform any high-risk operations, you can create IAM users for the software developers and grant them only the permissions required for using DataArts Studio resources.

                                                                            -

                                                                            DataArts Studio Permissions

                                                                            By default, new IAM users do not have any permissions. To assign permissions to a user, add the user to one or more groups and assign permissions policies or roles to these groups. The user then inherits permissions from the groups it is a member of After authorization, the users can perform specified operations.

                                                                            -

                                                                            DataArts Studio is a project-level service deployed in specific physical regions. To assign ServiceStage permissions to a user group, specify the scope as region-specific projects and select projects for the permissions to take effect. If All projects is selected, the permissions will take effect for the user group in all region-specific projects. When accessing DataArts Studio, users need to switch to a region where they are authorized to use cloud services.

                                                                            -

                                                                            DataArts Studio supports only system role-based authorization and does not support policy-based authorization. To implement fine-grained permission control, DataArts Studio provides the capability of granting permissions to system roles and workspace roles. Specific operation permissions are granted to workspace roles, and workspace roles with different permissions can be customized.

                                                                            -
                                                                            IAM provides the following two authorization mechanisms: Note that DataArts Studio supports only the IAM role-based authorization and does not support the IAM policy-based authorization.
                                                                            • IAM Roles: IAM initially provides a coarse-grained authorization mechanism to define permissions based on users' job responsibilities. This mechanism provides only a limited number of service-level roles for authorization. However, traditional IAM roles are not an ideal choice for fine-grained authorization and secure access control.
                                                                            • IAM Policies: A type of fine-grained authorization mechanism that defines permissions required to perform operations on specific cloud resources under certain conditions. This type of authorization is more flexible and is ideal for least privilege access.
                                                                            +

                                                                            If you need to assign different permissions to employees in your enterprise to access your DataArts Studio resources, IAM is a good choice for fine-grained permissions management. IAM provides identity authentication, permissions management, and access control, helping you secure access to your resources.

                                                                            +

                                                                            With IAM, you can use your account to create IAM users for your employees, and assign permissions to the users to control their access to specific resource types. For example, if you want to allow some software developers in your enterprise to use DataArts Studio resources but disallow them to delete workspaces or perform any high-risk operations, you can create IAM users for the software developers and grant them only the permissions required for using DataArts Studio resources.

                                                                            +

                                                                            DataArts Studio Permissions

                                                                            New IAM users do not have any permissions assigned by default. You need to first add them to one or more groups and then attach policies or roles to these groups. After authorization, the users can perform specified operations.

                                                                            +

                                                                            DataArts Studio is a project-level service deployed in specific physical regions. To assign permissions to a user group, specify the scope as region-specific projects and select projects for the permissions to take effect. If All projects is selected, the permissions will take effect for the user group in all region-specific projects. When accessing DataArts Studio, users need to switch to a region where they are authorized to use cloud services.

                                                                            +

                                                                            DataArts Studio supports only system role-based authorization and does not support policy-based authorization. To implement fine-grained permission control, DataArts Studio provides the capability of granting permissions to system roles and workspace roles. Specific operation permissions are granted to workspace roles, and workspace roles with different permissions can be customized.

                                                                            +
                                                                            IAM provides the following two authorization mechanisms: Note that DataArts Studio supports only the IAM role-based authorization and does not support the IAM policy-based authorization.
                                                                            • IAM Roles: IAM initially provides a coarse-grained authorization mechanism to define permissions based on users' job responsibilities. Only a limited number of service-level roles are available. However, traditional IAM roles are not an ideal choice for fine-grained authorization and secure access control.
                                                                            • IAM Policies: A type of fine-grained authorization mechanism that defines permissions required to perform operations on specific cloud resources under certain conditions. This type of authorization is more flexible and is ideal for least privilege access.
                                                                            -
                                                                            As shown in Figure 1 and Table 1, the system-defined roles supported by DataArts Studio include DARTS Administrator and DARTS User. Workspace roles are based on the DARTS User. Permissions lists the common operations supported by DataArts Studio and the permissions granted to each role. You can select roles as required.
                                                                            Figure 1 Permission system
                                                                            +
                                                                            As shown in Figure 1 and Table 1 and Table 1, the system-defined roles supported by DataArts Studio include DARTS Administrator and DARTS User. Workspace roles are based on the DARTS User. Permissions lists the common operations supported by DataArts Studio and the permissions granted to each role. You can select roles as required.
                                                                            Figure 1 Permission system
                                                                            -
                                                                            Table 2 Restrictions for using DataArts Studio

                                                                            Module

                                                                            Restriction

                                                                            Public

                                                                            1. DataArts Studio is a one-stop platform that provides data integration, development, and governance capabilities. DataArts Studio has no storage or computing capability and relies on the data lake base.
                                                                            2. Only one DataArts Studio instance can be bound to an enterprise project. If an enterprise project already has an instance, no more instance can be added.
                                                                            3. Different components of DataArts Studio support different data sources. You need to select a data lake foundation based on your service requirements. For details about the data lakes supported by DataArts Studio, see "Management Center" > "Data Sources Supported by DataArts Studio" in DataArts Studio User Guide.
                                                                            +
                                                                            1. DataArts Studio is a one-stop platform that provides data integration, development, and governance capabilities. DataArts Studio has no storage or computing capability and relies on the data lake base.
                                                                            2. Only one DataArts Studio instance can be bound to an enterprise project. If an enterprise project already has an instance, no more instance can be added.
                                                                            3. Different modules of DataArts Studio support different data sources. You need to select a data lake foundation based on your service requirements. For details about the data lakes supported by DataArts Studio, see "Management Center" > "Data Sources Supported by DataArts Studio" in DataArts Studio User Guide.

                                                                            Management Center

                                                                            1. Due to the constraints of Management Center, other components (such as DataArts Architecture, DataArts Quality, and DataArts Catalog) do not support databases or tables whose names contain Chinese characters or periods (.).
                                                                            2. You are advised to use different CDM clusters for a data connection agent in Management Center and a CDM migration job. If an agent and CDM job use the same cluster, they may contend for resources during peak hours, resulting in service unavailability.
                                                                            3. If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                                            4. If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                              +
                                                                            1. Due to the constraints of Management Center, other modules (such as DataArts Architecture, DataArts Quality, and DataArts Catalog) do not support databases or tables whose names contain Chinese characters or periods (.).
                                                                            2. You are advised to use different CDM clusters for a data connection agent in Management Center and a CDM migration job. If an agent and CDM job use the same cluster, they may contend for resources during peak hours, resulting in service unavailability.
                                                                            3. If you use the same CDM cluster as the agent for multiple connections to MRS clusters with Kerberos authentication enabled, jobs will fail. You are advised to plan multiple CDM clusters based on service requirements.
                                                                            4. If a CDM cluster functions as the agent for a data connection in Management Center, the cluster supports a maximum of 200 concurrent active threads. If multiple data connections share an agent, a maximum of 200 SQL, Shell, and Python scripts submitted through the connections can run concurrently. Excess tasks will be queued. You are advised to plan multiple agents based on the workload.

                                                                            5. A maximum of 200 data connections can be created in a workspace.
                                                                            6. The concurrency restriction for APIs in Management Center is 100 QPS.

                                                                            DataArts Factory

                                                                            1. You can enable backup of assets such as scripts and jobs to OBS buckets. For details, see DataArts Factory > O&M and Scheduling > Managing Backups in DataArts Studio User Guide.
                                                                            2. The execution history of scripts, jobs, and nodes is stored in OBS buckets. If no OBS bucket is available, you cannot view the execution history.
                                                                            3. Resources from an HDFS can be used only by MRS Spark, MRS Flink Job, and MRS MapReduce nodes.
                                                                            4. A workspace can contain a maximum of 10,000 scripts, a maximum of 5,000 script directories, and a maximum of 10 directory levels.
                                                                            5. A workspace can contain a maximum of 10,000 jobs, a maximum of 5,000 job directories, and a maximum of 10 directory levels.
                                                                            6. A maximum of 1,000 execution results can be displayed for RDS SQL, DWS SQL, Hive SQL, DLI SQL, and Spark SQL scripts, and the data volume is less than 3 MB. If the number of execution results exceeds 1,000, you can dump them. A maximum of 10,000 execution results can be dumped.
                                                                            7. Only data of the last six months can be displayed on the Monitor Instance and Monitor PatchData pages.
                                                                            8. Only notification records of the last 30 days can be displayed.
                                                                            9. The download records age out every seven days. When aged out, download records and the data dumped to OBS are both deleted.
                                                                            +
                                                                            1. You can enable backup of assets such as scripts and jobs to OBS buckets. For details, see DataArts Factory > O&M and Scheduling > Managing Backups in DataArts Studio User Guide.
                                                                            2. The execution history of scripts, jobs, and nodes is stored in OBS buckets. If no OBS bucket is available, you cannot view the execution history.
                                                                            3. Resources from an HDFS can be used only by MRS Spark, MRS Flink Job, and MRS MapReduce nodes.
                                                                            4. A workspace can contain a maximum of 10,000 scripts (including SQL, Shell, and Python scripts), 5,000 script directories, and 10 directory levels.
                                                                            5. A workspace can contain a maximum of 10,000 jobs (including batch processing jobs, real-time processing jobs, offline migration jobs, and real-time migration jobs), 5,000 job directories, and 10 directory levels.
                                                                            6. A workspace can contain a maximum of 500 real-time jobs (including real-time processing jobs and real-time migration jobs).
                                                                            7. A maximum of 1,000 execution results can be displayed for RDS SQL, DWS SQL, Hive SQL, DLI SQL, and Spark SQL scripts, and the data volume is less than 3 MB. If the number of execution results exceeds 1,000, you can dump them. A maximum of 10,000 execution results or 3 MB data can be dumped.
                                                                            8. Only data of the last six months can be displayed on the Monitor Instance and Monitor PatchData pages.
                                                                            9. Only notification records of the last 30 days can be displayed.
                                                                            10. The download records age out every seven days. When aged out, download records and the data dumped to OBS are both deleted.

                                                                            DataArts Architecture

                                                                            1. DataArts Architecture supports ER modeling and dimensional modeling (only star models).
                                                                            2. The maximum size of a file to be imported is 4 MB. A maximum of 3,000 metrics can be imported. A maximum of 500 tables can be exported at a time.
                                                                            3. Lookup tables and data standards cannot be created in their root directories.
                                                                            4. The quotas for the objects in a workspace are as follows:
                                                                              • Subjects: 5,000
                                                                              • Data standard directories: 500; data standards: 20,000
                                                                              • Business metrics: 100,000
                                                                              • Atomic, derivative, and compound metrics: 5,000 for each
                                                                              +
                                                                            1. DataArts Architecture supports ER modeling, dimensional modeling (only star models), and data mart.
                                                                            2. The maximum size of a file to be imported is 4 MB. A maximum of 3,000 metrics can be imported. A maximum of 500 tables can be exported at a time.
                                                                            3. A maximum of 200 objects can be operated at a time in DataArts Architecture.
                                                                            4. The quotas for the objects in a workspace are as follows:
                                                                              • Subjects: 5,000
                                                                              • Data standard directories: 500; data standards: 20,000
                                                                              • Business metrics: 100,000
                                                                              • Atomic, derivative, and compound metrics: 5,000 for each
                                                                            5. The quotas for different custom objects are as follows:
                                                                              • Custom subjects: 10
                                                                              • Custom tables: 30
                                                                              • Custom attributes: 10
                                                                              • Custom business metrics: 50
                                                                              -
                                                                            +
                                                                          • The name of a physical model table can contain a maximum of 200 characters.
                                                                          • If you select Description, field comments of a table must be unique.
                                                                          • If DataArts Architecture uses MRS Spark connections and DataArts Catalog uses MRS Hive connections to collect data, and if there are multiple Hive connections in the same cluster, you must use all these Hive connections to collect data in DataArts Catalog. Otherwise, tables may not be found during reversing in DataArts Architecture.
                                                                          • DataArts Quality

                                                                            1. The execution duration of data quality jobs depends on the data engine. If the data engine does not have sufficient resources, the execution of data quality jobs may be slow.
                                                                            2. A maximum of 50 rules can be configured for a data quality job. If necessary, you can create multiple quality jobs.
                                                                            3. By default, a maximum of 1,000 SQL statements associated with a quality job of a data connection can be executed concurrently. Excess SQL statements will be queued. The value ranges from 10 to 1000.
                                                                            4. By default, a maximum of 10,000 SQL statements associated with a quality job in a region can be executed concurrently. Excess SQL statements will be queued.
                                                                            5. In the Instance Running Status and Instance Alarm Status areas on the Dashboard page on the Metric Monitoring page, data of the last seven days is displayed. On the Alarms, Scenarios, and Metrics pages, data of the last seven, 15, or 30 days can be displayed.
                                                                            6. In the Quantity Changes area on the Dashboard page on the Quality Monitoring page, data of 30 days can be displayed. In the Alarm Trend by Severity and Rule Quantity Trend areas, data of the last seven days can be displayed.
                                                                            7. Quality reports are generated in batches on the T+1 day and retained for 90 days.
                                                                            8. If you export a quality report to OBS, the report is exported to the OBS path for storing job logs configured for the workspace. The exported record is retained for three months.
                                                                            +
                                                                            1. The execution duration of quality jobs and comparison jobs depends on the data engine. If the data engine does not have sufficient resources, the execution of data quality jobs may be slow.
                                                                            2. A maximum of 50 subjobs (rules) can be configured for a quality job. If necessary, you can create multiple quality jobs.
                                                                            3. A maximum of five subjobs (rules) can be configured for a comparison job. If necessary, you can create multiple comparison jobs.
                                                                            4. Each subjob of a quality job or comparison job can have a maximum of 300 data objects (databases, tables, and fields).
                                                                            5. By default, a maximum of 1,000 SQL statements associated with a quality job of a data connection can be executed concurrently. Excess SQL statements will be queued. The value ranges from 10 to 1000.
                                                                            6. By default, a maximum of 10,000 SQL statements associated with a quality job in a region can be executed concurrently. Excess SQL statements will be queued.
                                                                            7. In the Quantity Changes area on the Dashboard page on the Quality Monitoring page, data of 30 days can be displayed. In the Alarm Trend by Severity and Rule Quantity Trend areas, data of the last seven days can be displayed.
                                                                            8. Quality reports are generated in batches on the T+1 day and retained for 90 days.
                                                                            9. If you export a quality report to OBS, the report is exported to the OBS path for storing job logs configured for the workspace. The exported record is retained for three months.

                                                                            DataArts Catalog

                                                                            1. A maximum of 100 metadata collection tasks can be created in a workspace.
                                                                            2. Metadata collection tasks can be obtained through DDL SQL statements of the engine. You are not advised to collect more than 1,000 tables through a single task. If necessary, you can create multiple collection tasks. In addition, you need to set the scheduling time and frequency properly based on your requirements to avoid heavy access and connection pressure on the engine. The recommended settings are as follows:
                                                                              • If your service requires a metadata validity period of one day, set the scheduling period to max(one day, one-off collection period). This rule also applies to other scenarios.
                                                                              • If your service mainly runs in the daytime, set a scheduling time in the night during which the metadata collection has the minimum impact on the data source. This rule also applies to other scenarios.
                                                                              -
                                                                            3. Only the jobs that are scheduled and executed in DataArts Factory generate data lineages. Tested jobs do not generate data lineages.
                                                                            4. Historical data connections of the last seven days, 15 days, or 30 days can be displayed on the Dashboard page on the Metadata Collection page.
                                                                            -

                                                                            DataArts DataService

                                                                            -
                                                                            1. The shared edition is designed only for development and testing. You are advised to use the exclusive edition which is superior to the shared edition.
                                                                            2. A maximum of five DataArts DataService Exclusive clusters can be created in a DataArts Studio instance. Each cluster must be associated with a workspace and cannot belong to multiple workspaces.
                                                                            3. After a DataArts DataService Exclusive cluster is created, its specifications cannot be modified, and its version cannot be upgraded.
                                                                            4. The maximum number of DataArts DataService Exclusive APIs that can be created in a DataArts Studio instance is the quota of DataArts DataService Exclusive APIs (5,000 by default) or the total API quotas of the clusters in the instance, whichever is smaller. For example, if the quota of DataArts DataService Exclusive APIs for a DataArts Studio instance is 5,000, and two clusters whose API quotas are 500 and 2,000 respectively have been created in the instance, a maximum of 2,500 DataArts DataService Exclusive APIs can be created in the instance.
                                                                            5. The maximum number of DataArts DataService Exclusive APIs that can be created in a workspace is the quota of DataArts DataService Exclusive APIs (configured in the workspace information) or the total API quotas of the clusters in the instance, whichever is smaller. For example, if the quota of DataArts DataService Exclusive APIs for a workspace is 800, and two clusters whose API quotas are both 500 have been created in the workspace, a maximum of 800 DataArts DataService Exclusive APIs can be created in the workspace.
                                                                            6. A maximum of 1,000 applications can be created in a workspace.
                                                                            7. A maximum of 500 throttling policies can be created in a workspace.
                                                                            8. DataArts DataService allows you to trace and save events. For each event, DataArts DataService records information such as the date, description, and time source (a cluster). Events are retained for 30 days.
                                                                            9. From the log of a DataArts DataService Exclusive cluster, you can only obtain the last 100 access records of the cluster, evenly from all nodes of the cluster.
                                                                            10. In the APIs Called, APIs Published, Top 5 APIs by Call Rate, Top 5 APIs by Call Duration, and Top 5 APIs by Call Quantity areas on the Overview page, data of the last 12 hours, one day, seven days, or 30 days can be displayed. The total number of API calls is the sum of the number of APIs made in the last seven days (excluding the current day).
                                                                            +
                                                                          • Only the jobs that are scheduled and executed in DataArts Factory generate data lineages. Tested jobs do not generate data lineages.
                                                                          • Historical data connections of the last seven days, 15 days, or 30 days can be displayed on the Dashboard page on the Metadata Collection page.
                                                                          • Table 1 DataArts Studio system-defined roles

                                                                            Role

                                                                            +
                                                                            - - - - - - - - @@ -42,8 +42,8 @@ -

                                                                            Roles or Policies for DataArts Studio Console

                                                                            Table 2 lists the permissions for the services on which DataArts Studio components depend. You are advised to configure the minimum DataArts Studio-level permissions of dependent services for developers. Table 3 lists the minimum permissions for developers on the services on which DataArts Studio depends.

                                                                            -

                                                                            The DARTS Administrator and DARTS User already have the administrator permissions of dependent services. If the DARTS User role is assigned to a common user or user group, the common user or user group may have more permissions of dependent services than required. To prevent this risk, you can manually delete the permissions of dependent services from the user group after assigning the DARTS User role to the user group, and then assign the minimum permissions of dependent services to the user group.

                                                                            +

                                                                            Roles or Policies for DataArts Studio Console

                                                                            Table 2 lists the permissions for the services on which DataArts Studio modules depend. You are advised to configure the minimum DataArts Studio-level permissions of dependent services for developers. Table 3 lists the minimum permissions for developers on the services on which DataArts Studio depends.

                                                                            +

                                                                            The DARTS Administrator and DARTS User already have the administrator permissions of dependent services. If the DARTS User role is assigned to a common user or user group, the common user or user group may have more permissions of dependent services than required. To prevent this risk, you can manually delete the permissions of dependent services from the user group after assigning the DARTS User role to the user group, and then assign the minimum permissions of dependent services to the user group.

                                                                            Table 1 DataArts Studio system-defined roles

                                                                            Role

                                                                            Description

                                                                            +

                                                                            Description

                                                                            Category

                                                                            +

                                                                            Type

                                                                            DARTS Administrator

                                                                            +

                                                                            DARTS Administrator

                                                                            Instance administrator who has all management permissions on a DataArts Studio instance and its workspaces, permissions of dependent services, and service operation permissions in all workspaces.

                                                                            -
                                                                            NOTE:

                                                                            Users assigned the Tenant Administrator role have all permissions for all services except IAM. In other words, users with the Tenant Administrator role can perform all operations in DataArts Studio.

                                                                            +

                                                                            Instance administrator who has all management permissions on a DataArts Studio instance and its workspaces, permissions of dependent services, and service operation permissions in all workspaces.

                                                                            +
                                                                            NOTE:

                                                                            Users assigned the Tenant Administrator role have all permissions for all services except IAM. In other words, users with the Tenant Administrator role can perform all operations in DataArts Studio.

                                                                            System-defined role

                                                                            +

                                                                            System-defined role

                                                                            DARTS User

                                                                            +

                                                                            DARTS User

                                                                            Common user who has permissions to view a DataArts Studio instance and its workspaces, and the permissions of dependent services. After assigned a role, a common user has permissions of the role to perform service operations.

                                                                            -
                                                                            Workspace roles include the preset admin, developer, deployer, operator, and viewer, and other custom roles. For details about the operation permissions of each role, see Permissions.
                                                                            • Admin: This role has all operation permissions in a workspace. You are advised to assign the admin role to the project owner, development owner, and O&M administrator.
                                                                            • Developer: This role has permissions to create and manage resources in a workspace. You are advised to assign this role to users who develop and process tasks.
                                                                            • Operator: This role has the operation permissions of services such as O&M and scheduling in a workspace, but cannot modify resources or configurations. You are advised to assign this role to users responsible for O&M management and status monitoring.
                                                                            • Viewer: This role can view data in a workspace but cannot perform any other operation. You are advised to assign this role to users who only need to view data in a workspace but do not need to perform operations.
                                                                            • Deployer: This role is unique to the enterprise mode and has permissions to release task packages in a workspace. In enterprise mode, when a developer submits a script or job version, the system generates a release task. After the developer confirms the release and the deployer approves the release request, the modified job is synchronized to the production environment.
                                                                            • Custom roles: If the preset roles cannot meet your requirements, you can create custom roles. You can configure permissions for such roles to meet the the principle of least privilege (PoLP).
                                                                            +

                                                                            Common user who has permissions to view a DataArts Studio instance and its workspaces, and the permissions of dependent services. After assigned a role, a common user has permissions of the role to perform service operations.

                                                                            +
                                                                            Workspace roles include the preset admin, developer, deployer, operator, and viewer, and other custom roles. For details about the operation permissions of each role, see Permissions.
                                                                            • Admin: This role has all operation permissions in a workspace. You are advised to assign the admin role to the project owner, development owner, and O&M administrator.
                                                                            • Developer: This role has permissions to create and manage resources in a workspace. You are advised to assign this role to users who develop and process tasks.
                                                                            • Operator: This role has the operation permissions of services such as O&M and scheduling in a workspace, but cannot modify resources or configurations. You are advised to assign this role to users responsible for O&M management and status monitoring.
                                                                            • Viewer: This role can view data in a workspace but cannot perform any other operation. You are advised to assign this role to users who only need to view data in a workspace but do not need to perform operations.
                                                                            • Deployer: This role is unique to the enterprise mode and has permissions to release task packages in a workspace. In enterprise mode, when a developer submits a script or job version, the system generates a release task. After the developer confirms the release and the deployer approves the release request, the modified job is synchronized to the production environment.
                                                                            • Custom roles: If the preset roles cannot meet your requirements, you can create custom roles You can configure permissions for such roles to meet the the principle of least privilege (PoLP).

                                                                            System-defined role

                                                                            +

                                                                            System-defined role

                                                                            - @@ -341,7 +339,7 @@ -
                                                                            Table 2 Roles or policies for the services on which the DataArts Studio console depends on

                                                                            Console Function

                                                                            @@ -106,7 +106,6 @@

                                                                            vpc:publicIps:get

                                                                            vpc:publicIps:list

                                                                            vpc:vpcs:get

                                                                            -

                                                                            vpc:port:get

                                                                            vpc:subnets:get

                                                                            Create MRS connections.

                                                                            @@ -128,7 +127,6 @@

                                                                            vpc:publicIps:list

                                                                            vpc:vpcs:get

                                                                            vpc:vpcs:list

                                                                            -

                                                                            vpc:port:get

                                                                            vpc:subnets:get

                                                                            vpc:securityGroups:get

                                                                            vpc:firewalls:list

                                                                            @@ -229,7 +227,7 @@

                                                                            Create RDS connections.

                                                                            RMS

                                                                            +

                                                                            Config

                                                                            rms:resources:list

                                                                            ces:metricData:list

                                                                            Query the CPU usage of the DLI queue on the Overview page.

                                                                            +

                                                                            Query the CPU usage of the DLI queue on the Overview page.

                                                                            GES

                                                                            @@ -620,7 +618,7 @@
                                                                            -
                                                                            - @@ -556,7 +578,7 @@ - @@ -620,6 +642,8 @@ diff --git a/docs/dataartsstudio/umn/dataartsstudio_12_0002.html b/docs/dataartsstudio/umn/dataartsstudio_12_0002.html deleted file mode 100644 index df4861cc8..000000000 --- a/docs/dataartsstudio/umn/dataartsstudio_12_0002.html +++ /dev/null @@ -1,25 +0,0 @@ - - - -

                                                                            Preparations

                                                                            - -

                                                                            -
                                                                            - - - diff --git a/docs/dataartsstudio/umn/dataartsstudio_12_0004.html b/docs/dataartsstudio/umn/dataartsstudio_12_0004.html index 6f99e4683..bcc5daa4a 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_12_0004.html +++ b/docs/dataartsstudio/umn/dataartsstudio_12_0004.html @@ -8,11 +8,13 @@
                                                                            - + + + + + + @@ -16,13 +30,13 @@
                                                                            Table 3 Minimum permissions for developers on the services on which DataArts Studio depends

                                                                            Permission Type

                                                                            +
                                                                            @@ -631,21 +629,21 @@ - - - - - + + + + + + + + + + + +
                                                                            Table 3 Minimum permissions for developers on the services on which DataArts Studio depends

                                                                            Permission Type

                                                                            Role/Policy-based permissions–system role

                                                                            Mandatory

                                                                            Mandatory

                                                                            +

                                                                            Mandatory

                                                                            Mandatory

                                                                            +

                                                                            Mandatory

                                                                            Mandatory

                                                                            +

                                                                            Mandatory

                                                                            Permission

                                                                            • DIS Operator
                                                                            • DIS User
                                                                            • (Optional and not recommended) SWR Admin
                                                                              NOTE:

                                                                              The image read permission in SWR is required only when a custom image is selected for a DLI Spark node of a job in DataArts Factory.

                                                                              +
                                                                            • DIS Operator
                                                                            • DIS User
                                                                            • (Optional and not recommended) SWR Admin
                                                                              NOTE:

                                                                              The image read permission in SWR is required only when a custom image is selected for a DLI Spark node of a job in DataArts Factory.

                                                                              You are advised to add the read permission of the image by referring to . You are not advised to directly assign the SWR Admin system role to users because this may result in excessive permissions.

                                                                            DataArtsStudio_PermissionsOfDependentServices_global: custom policy for a global dependent cloud service
                                                                            {
                                                                            +
                                                                            DataArtsStudio_PermissionsOfDependentServices_global: custom policy for a global dependent cloud service
                                                                            {
                                                                                 "Version": "1.1",
                                                                                 "Statement": [
                                                                                     {
                                                                            @@ -795,7 +793,6 @@
                                                                                             "vpc:publicIps:get",
                                                                                             "vpc:vpcs:get",
                                                                                             "vpc:vpcs:list",
                                                                            -                "vpc:port:get",
                                                                                             "vpc:subnets:get",
                                                                                             "vpc:securityGroups:get",
                                                                                             "vpc:firewalls:list",
                                                                            @@ -819,3 +816,10 @@
                                                                             
                                                                            + + \ No newline at end of file diff --git a/docs/dataartsstudio/umn/dataartsstudio_07_013.html b/docs/dataartsstudio/umn/dataartsstudio_07_013.html index c1064af7f..1b7dd06c4 100644 --- a/docs/dataartsstudio/umn/dataartsstudio_07_013.html +++ b/docs/dataartsstudio/umn/dataartsstudio_07_013.html @@ -388,6 +388,28 @@

                                                                            N

                                                                            Binding EIPs

                                                                            +

                                                                            Y

                                                                            +

                                                                            N

                                                                            +

                                                                            N

                                                                            +

                                                                            N

                                                                            +

                                                                            Unbinding EIPs

                                                                            +

                                                                            Y

                                                                            +

                                                                            N

                                                                            +

                                                                            N

                                                                            +

                                                                            N

                                                                            +
                                                                            @@ -478,7 +500,7 @@

                                                                            Y

                                                                            N

                                                                            +

                                                                            Y

                                                                            Y

                                                                            Y

                                                                            N

                                                                            +

                                                                            Y

                                                                            Y

                                                                            Y

                                                                            Y

                                                                            +
                                                                            NOTE:

                                                                            In enterprise mode, developers do not have the permission to create notifications.

                                                                            +

                                                                            N

                                                                            2025-05-10

                                                                            +

                                                                            2025-08-15

                                                                            +

                                                                            Remove images that are not applicable in the chapter.:

                                                                            + +

                                                                            2025-07-30

                                                                            +

                                                                            Update the following content:

                                                                            +
                                                                            • Adapt to the new version, update the documentation for the new version, and include feature descriptions and configuration-related content as the version updates.
                                                                            • The new version of the document has been optimized, including some chapter titles and content descriptions, but the essential content remains unchanged.
                                                                              For example, the first-level navigation "Preparations" has been integrated into the "User Guide," and "Preparations" has been removed. +
                                                                              +
                                                                            +

                                                                            2025-05-10

                                                                            Change system-defined roles to DARTS Administrator and DARTS User.

                                                                            2025-01-21

                                                                            Update the following sections to fix table breakage issue:

                                                                            - +

                                                                            2024-10-25

                                                                            Update the following sections:

                                                                            -
                                                                            • Management Center support distributed GaussDB connections. +
                                                                              • Management Center support distributed GaussDB connections.
                                                                              • DataArts Factory supports the following features.
                                                                                • Support for manual triggering of jobs.

                                                                                  The instances generated for a job are in Pending confirmation state and are executed only after manual confirmation if parameter Manual confirmation is selected for the job. For details, see Setting Up Scheduling for a Job Using the Batch Processing Mode.

                                                                                • Support scheduling of jobs based on a calendar.

                                                                                  Scheduling calendars can be created and associated with jobs. Jobs are executed normally on working days of the calendar, with dry run on non-working days. For details, see Configuring a Scheduling Calendar.

                                                                                • Support OBS Listening for periodic scheduling, which allows job scheduling to be triggered by OBS file listening.

                                                                                  If OBS listening is enabled in the scheduling configuration of a job, the job listens for files in the OBS path. If there is a file in the OBS path, and the upstream job is successful, the current job will be scheduled at the scheduling time. If there is no file in the OBS path, the job continues to listen for files until the listening duration ends. For details, see Setting Up Scheduling for a Job Using the Batch Processing Mode.

                                                                                  @@ -33,14 +47,14 @@

                                                                            2024-03-01

                                                                            Update the following sections:

                                                                            - +

                                                                            2023-04-30

                                                                            Update the following sections:

                                                                            - +

                                                                            2023-03-30

                                                                            diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788044.png b/docs/dataartsstudio/umn/en-us_image_0000002234068868.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788044.png rename to docs/dataartsstudio/umn/en-us_image_0000002234068868.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234075564.png b/docs/dataartsstudio/umn/en-us_image_0000002234075564.png new file mode 100644 index 000000000..a880af58e Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234075564.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847530.png b/docs/dataartsstudio/umn/en-us_image_0000002234075784.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847530.png rename to docs/dataartsstudio/umn/en-us_image_0000002234075784.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847522.png b/docs/dataartsstudio/umn/en-us_image_0000002234075804.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847522.png rename to docs/dataartsstudio/umn/en-us_image_0000002234075804.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790852.png b/docs/dataartsstudio/umn/en-us_image_0000002234075884.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790852.png rename to docs/dataartsstudio/umn/en-us_image_0000002234075884.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791012.png b/docs/dataartsstudio/umn/en-us_image_0000002234075964.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791012.png rename to docs/dataartsstudio/umn/en-us_image_0000002234075964.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440105.png b/docs/dataartsstudio/umn/en-us_image_0000002234076104.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440105.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076104.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847174.png b/docs/dataartsstudio/umn/en-us_image_0000002234076120.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847174.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076120.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791492.png b/docs/dataartsstudio/umn/en-us_image_0000002234076228.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791492.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076228.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405577.png b/docs/dataartsstudio/umn/en-us_image_0000002234076288.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405577.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076288.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440853.png b/docs/dataartsstudio/umn/en-us_image_0000002234076300.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440853.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076300.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788876.png b/docs/dataartsstudio/umn/en-us_image_0000002234076304.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788876.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076304.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440845.png b/docs/dataartsstudio/umn/en-us_image_0000002234076308.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440845.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076308.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788920.png b/docs/dataartsstudio/umn/en-us_image_0000002234076316.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788920.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076316.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789456.png b/docs/dataartsstudio/umn/en-us_image_0000002234076364.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789456.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076364.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846318.png b/docs/dataartsstudio/umn/en-us_image_0000002234076372.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846318.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076372.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440145.png b/docs/dataartsstudio/umn/en-us_image_0000002234076400.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440145.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076400.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234076428.png b/docs/dataartsstudio/umn/en-us_image_0000002234076428.png new file mode 100644 index 000000000..0384e163f Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234076428.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847118.png b/docs/dataartsstudio/umn/en-us_image_0000002234076436.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847118.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076436.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845686.png b/docs/dataartsstudio/umn/en-us_image_0000002234076524.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845686.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076524.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845238.png b/docs/dataartsstudio/umn/en-us_image_0000002234076600.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845238.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076600.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439469.png b/docs/dataartsstudio/umn/en-us_image_0000002234076628.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439469.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076628.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848590.png b/docs/dataartsstudio/umn/en-us_image_0000002234076948.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848590.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076948.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848462.png b/docs/dataartsstudio/umn/en-us_image_0000002234076960.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848462.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076960.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441533.png b/docs/dataartsstudio/umn/en-us_image_0000002234076984.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441533.png rename to docs/dataartsstudio/umn/en-us_image_0000002234076984.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848606.png b/docs/dataartsstudio/umn/en-us_image_0000002234077004.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848606.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077004.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789076.png b/docs/dataartsstudio/umn/en-us_image_0000002234077100.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789076.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077100.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789624.png b/docs/dataartsstudio/umn/en-us_image_0000002234077148.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789624.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077148.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845726.png b/docs/dataartsstudio/umn/en-us_image_0000002234077152.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845726.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077152.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789600.png b/docs/dataartsstudio/umn/en-us_image_0000002234077160.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789600.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077160.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846502.png b/docs/dataartsstudio/umn/en-us_image_0000002234077176.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846502.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077176.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438709.png b/docs/dataartsstudio/umn/en-us_image_0000002234077236.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438709.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077236.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405525.png b/docs/dataartsstudio/umn/en-us_image_0000002234077296.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405525.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077296.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406701.png b/docs/dataartsstudio/umn/en-us_image_0000002234077316.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406701.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077316.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791224.png b/docs/dataartsstudio/umn/en-us_image_0000002234077360.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791224.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077360.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848086.png b/docs/dataartsstudio/umn/en-us_image_0000002234077380.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848086.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077380.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441041.png b/docs/dataartsstudio/umn/en-us_image_0000002234077400.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441041.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077400.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441397.png b/docs/dataartsstudio/umn/en-us_image_0000002234077436.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441397.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077436.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848454.png b/docs/dataartsstudio/umn/en-us_image_0000002234077444.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848454.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077444.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441385.png b/docs/dataartsstudio/umn/en-us_image_0000002234077448.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441385.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077448.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848370.png b/docs/dataartsstudio/umn/en-us_image_0000002234077464.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848370.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077464.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441373.png b/docs/dataartsstudio/umn/en-us_image_0000002234077496.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441373.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077496.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790924.png b/docs/dataartsstudio/umn/en-us_image_0000002234077572.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790924.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077572.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847946.png b/docs/dataartsstudio/umn/en-us_image_0000002234077580.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847946.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077580.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788772.png b/docs/dataartsstudio/umn/en-us_image_0000002234077588.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788772.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077588.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790608.png b/docs/dataartsstudio/umn/en-us_image_0000002234077652.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790608.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077652.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407757.png b/docs/dataartsstudio/umn/en-us_image_0000002234077672.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407757.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077672.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234077736.png b/docs/dataartsstudio/umn/en-us_image_0000002234077736.png new file mode 100644 index 000000000..77b8dca18 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234077736.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439269.png b/docs/dataartsstudio/umn/en-us_image_0000002234077768.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439269.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077768.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407797.png b/docs/dataartsstudio/umn/en-us_image_0000002234077772.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407797.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077772.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439401.png b/docs/dataartsstudio/umn/en-us_image_0000002234077808.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439401.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077808.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439889.png b/docs/dataartsstudio/umn/en-us_image_0000002234077840.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439889.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077840.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406837.png b/docs/dataartsstudio/umn/en-us_image_0000002234077844.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406837.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077844.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406205.png b/docs/dataartsstudio/umn/en-us_image_0000002234077920.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406205.png rename to docs/dataartsstudio/umn/en-us_image_0000002234077920.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407277.png b/docs/dataartsstudio/umn/en-us_image_0000002234078204.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407277.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078204.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407281.png b/docs/dataartsstudio/umn/en-us_image_0000002234078220.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407281.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078220.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407121.png b/docs/dataartsstudio/umn/en-us_image_0000002234078240.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407121.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078240.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440161.png b/docs/dataartsstudio/umn/en-us_image_0000002234078248.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440161.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078248.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407129.png b/docs/dataartsstudio/umn/en-us_image_0000002234078264.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407129.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078264.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440173.png b/docs/dataartsstudio/umn/en-us_image_0000002234078284.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440173.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078284.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789964.png b/docs/dataartsstudio/umn/en-us_image_0000002234078360.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789964.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078360.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789552.png b/docs/dataartsstudio/umn/en-us_image_0000002234078364.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789552.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078364.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406917.png b/docs/dataartsstudio/umn/en-us_image_0000002234078784.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406917.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078784.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439725.png b/docs/dataartsstudio/umn/en-us_image_0000002234078864.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439725.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078864.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234078892.png b/docs/dataartsstudio/umn/en-us_image_0000002234078892.png new file mode 100644 index 000000000..d45382251 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234078892.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234078900.png b/docs/dataartsstudio/umn/en-us_image_0000002234078900.png new file mode 100644 index 000000000..eab9bb705 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234078900.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789844.png b/docs/dataartsstudio/umn/en-us_image_0000002234078916.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789844.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078916.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406613.png b/docs/dataartsstudio/umn/en-us_image_0000002234078960.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406613.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078960.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846666.png b/docs/dataartsstudio/umn/en-us_image_0000002234078972.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846666.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078972.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846658.png b/docs/dataartsstudio/umn/en-us_image_0000002234078980.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846658.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078980.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789796.png b/docs/dataartsstudio/umn/en-us_image_0000002234078988.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789796.png rename to docs/dataartsstudio/umn/en-us_image_0000002234078988.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790972.png b/docs/dataartsstudio/umn/en-us_image_0000002234079000.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790972.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079000.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407725.png b/docs/dataartsstudio/umn/en-us_image_0000002234079008.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407725.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079008.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440781.png b/docs/dataartsstudio/umn/en-us_image_0000002234079016.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440781.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079016.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234079328.png b/docs/dataartsstudio/umn/en-us_image_0000002234079328.png new file mode 100644 index 000000000..b43a86d00 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234079328.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407937.png b/docs/dataartsstudio/umn/en-us_image_0000002234079400.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407937.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079400.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846370.png b/docs/dataartsstudio/umn/en-us_image_0000002234079480.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846370.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079480.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790052.png b/docs/dataartsstudio/umn/en-us_image_0000002234079692.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790052.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079692.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234079932.png b/docs/dataartsstudio/umn/en-us_image_0000002234079932.png new file mode 100644 index 000000000..86fc6bf75 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234079932.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846750.png b/docs/dataartsstudio/umn/en-us_image_0000002234079976.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846750.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079976.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406633.png b/docs/dataartsstudio/umn/en-us_image_0000002234079984.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406633.png rename to docs/dataartsstudio/umn/en-us_image_0000002234079984.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234079996.png b/docs/dataartsstudio/umn/en-us_image_0000002234079996.png new file mode 100644 index 000000000..e496e9cdc Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234079996.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846754.png b/docs/dataartsstudio/umn/en-us_image_0000002234080000.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846754.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080000.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846758.png b/docs/dataartsstudio/umn/en-us_image_0000002234080008.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846758.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080008.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406661.png b/docs/dataartsstudio/umn/en-us_image_0000002234080176.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406661.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080176.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791080.png b/docs/dataartsstudio/umn/en-us_image_0000002234080348.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791080.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080348.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791124.png b/docs/dataartsstudio/umn/en-us_image_0000002234080412.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791124.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080412.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234080432.png b/docs/dataartsstudio/umn/en-us_image_0000002234080432.png new file mode 100644 index 000000000..65d561dc2 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234080432.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234080476.png b/docs/dataartsstudio/umn/en-us_image_0000002234080476.png new file mode 100644 index 000000000..a24d840bd Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234080476.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234080564.png b/docs/dataartsstudio/umn/en-us_image_0000002234080564.png new file mode 100644 index 000000000..ca7aaf3f0 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234080564.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789884.png b/docs/dataartsstudio/umn/en-us_image_0000002234080568.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789884.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080568.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791088.png b/docs/dataartsstudio/umn/en-us_image_0000002234080616.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791088.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080616.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234080632.png b/docs/dataartsstudio/umn/en-us_image_0000002234080632.png new file mode 100644 index 000000000..6034fb20e Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234080632.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847954.png b/docs/dataartsstudio/umn/en-us_image_0000002234080640.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847954.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080640.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406473.png b/docs/dataartsstudio/umn/en-us_image_0000002234080688.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406473.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080688.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789764.png b/docs/dataartsstudio/umn/en-us_image_0000002234080700.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789764.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080700.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846598.png b/docs/dataartsstudio/umn/en-us_image_0000002234080752.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846598.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080752.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234080764.png b/docs/dataartsstudio/umn/en-us_image_0000002234080764.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234080764.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789740.png b/docs/dataartsstudio/umn/en-us_image_0000002234080788.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789740.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080788.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408129.png b/docs/dataartsstudio/umn/en-us_image_0000002234080828.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408129.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080828.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406385.png b/docs/dataartsstudio/umn/en-us_image_0000002234080928.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406385.png rename to docs/dataartsstudio/umn/en-us_image_0000002234080928.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847506.png b/docs/dataartsstudio/umn/en-us_image_0000002234081196.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847506.png rename to docs/dataartsstudio/umn/en-us_image_0000002234081196.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234081428.png b/docs/dataartsstudio/umn/en-us_image_0000002234081428.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234081428.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234081440.png b/docs/dataartsstudio/umn/en-us_image_0000002234081440.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234081440.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790116.png b/docs/dataartsstudio/umn/en-us_image_0000002234081548.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790116.png rename to docs/dataartsstudio/umn/en-us_image_0000002234081548.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234082252.png b/docs/dataartsstudio/umn/en-us_image_0000002234082252.png new file mode 100644 index 000000000..897fa3e72 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234082252.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408305.png b/docs/dataartsstudio/umn/en-us_image_0000002234082412.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408305.png rename to docs/dataartsstudio/umn/en-us_image_0000002234082412.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848466.png b/docs/dataartsstudio/umn/en-us_image_0000002234082492.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848466.png rename to docs/dataartsstudio/umn/en-us_image_0000002234082492.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234082736.png b/docs/dataartsstudio/umn/en-us_image_0000002234082736.png new file mode 100644 index 000000000..3367c6c6c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234082736.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407373.png b/docs/dataartsstudio/umn/en-us_image_0000002234083444.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407373.png rename to docs/dataartsstudio/umn/en-us_image_0000002234083444.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234084820.png b/docs/dataartsstudio/umn/en-us_image_0000002234084820.png new file mode 100644 index 000000000..eeb6f0d9f Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234084820.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790808.png b/docs/dataartsstudio/umn/en-us_image_0000002234085024.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790808.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085024.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440625.png b/docs/dataartsstudio/umn/en-us_image_0000002234085036.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440625.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085036.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440441.png b/docs/dataartsstudio/umn/en-us_image_0000002234085076.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440441.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085076.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406585.png b/docs/dataartsstudio/umn/en-us_image_0000002234085136.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406585.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085136.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846914.png b/docs/dataartsstudio/umn/en-us_image_0000002234085212.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846914.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085212.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407605.png b/docs/dataartsstudio/umn/en-us_image_0000002234085224.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407605.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085224.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791264.png b/docs/dataartsstudio/umn/en-us_image_0000002234085352.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791264.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085352.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234085456.png b/docs/dataartsstudio/umn/en-us_image_0000002234085456.png new file mode 100644 index 000000000..ca1ab281d Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234085456.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790868.png b/docs/dataartsstudio/umn/en-us_image_0000002234085460.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790868.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085460.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406229.png b/docs/dataartsstudio/umn/en-us_image_0000002234085576.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406229.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085576.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406225.png b/docs/dataartsstudio/umn/en-us_image_0000002234085584.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406225.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085584.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790200.png b/docs/dataartsstudio/umn/en-us_image_0000002234085744.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790200.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085744.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440397.png b/docs/dataartsstudio/umn/en-us_image_0000002234085828.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440397.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085828.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790396.png b/docs/dataartsstudio/umn/en-us_image_0000002234085912.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790396.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085912.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791040.png b/docs/dataartsstudio/umn/en-us_image_0000002234085928.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791040.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085928.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848014.png b/docs/dataartsstudio/umn/en-us_image_0000002234085932.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848014.png rename to docs/dataartsstudio/umn/en-us_image_0000002234085932.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407765.png b/docs/dataartsstudio/umn/en-us_image_0000002234086156.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407765.png rename to docs/dataartsstudio/umn/en-us_image_0000002234086156.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407017.png b/docs/dataartsstudio/umn/en-us_image_0000002234086280.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407017.png rename to docs/dataartsstudio/umn/en-us_image_0000002234086280.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305404701.png b/docs/dataartsstudio/umn/en-us_image_0000002234228660.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305404701.png rename to docs/dataartsstudio/umn/en-us_image_0000002234228660.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440037.png b/docs/dataartsstudio/umn/en-us_image_0000002234235252.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440037.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235252.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234235396.png b/docs/dataartsstudio/umn/en-us_image_0000002234235396.png new file mode 100644 index 000000000..9a1433c32 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234235396.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234235528.png b/docs/dataartsstudio/umn/en-us_image_0000002234235528.png new file mode 100644 index 000000000..64b0190c4 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234235528.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406389.png b/docs/dataartsstudio/umn/en-us_image_0000002234235552.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406389.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235552.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234235580.png b/docs/dataartsstudio/umn/en-us_image_0000002234235580.png new file mode 100644 index 000000000..ed029bb22 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234235580.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234235616.png b/docs/dataartsstudio/umn/en-us_image_0000002234235616.png new file mode 100644 index 000000000..baae15c63 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234235616.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234235624.png b/docs/dataartsstudio/umn/en-us_image_0000002234235624.png new file mode 100644 index 000000000..f93f76971 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234235624.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788796.png b/docs/dataartsstudio/umn/en-us_image_0000002234235668.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788796.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235668.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406965.png b/docs/dataartsstudio/umn/en-us_image_0000002234235716.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406965.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235716.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847406.png b/docs/dataartsstudio/umn/en-us_image_0000002234235724.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847406.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235724.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440285.png b/docs/dataartsstudio/umn/en-us_image_0000002234235780.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440285.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235780.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790480.png b/docs/dataartsstudio/umn/en-us_image_0000002234235784.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790480.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235784.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407745.png b/docs/dataartsstudio/umn/en-us_image_0000002234235800.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407745.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235800.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790300.png b/docs/dataartsstudio/umn/en-us_image_0000002234235952.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790300.png rename to docs/dataartsstudio/umn/en-us_image_0000002234235952.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846498.png b/docs/dataartsstudio/umn/en-us_image_0000002234236140.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846498.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236140.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438677.png b/docs/dataartsstudio/umn/en-us_image_0000002234236144.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438677.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236144.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791044.png b/docs/dataartsstudio/umn/en-us_image_0000002234236152.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791044.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236152.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407585.png b/docs/dataartsstudio/umn/en-us_image_0000002234236192.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407585.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236192.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790368.png b/docs/dataartsstudio/umn/en-us_image_0000002234236216.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790368.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236216.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438865.png b/docs/dataartsstudio/umn/en-us_image_0000002234236240.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438865.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236240.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234236252.png b/docs/dataartsstudio/umn/en-us_image_0000002234236252.png new file mode 100644 index 000000000..f96bf0448 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234236252.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405845.png b/docs/dataartsstudio/umn/en-us_image_0000002234236264.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405845.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236264.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406573.png b/docs/dataartsstudio/umn/en-us_image_0000002234236268.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406573.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236268.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406569.png b/docs/dataartsstudio/umn/en-us_image_0000002234236276.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406569.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236276.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845798.png b/docs/dataartsstudio/umn/en-us_image_0000002234236364.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845798.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236364.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847370.png b/docs/dataartsstudio/umn/en-us_image_0000002234236424.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847370.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236424.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845810.png b/docs/dataartsstudio/umn/en-us_image_0000002234236592.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845810.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236592.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234236680.png b/docs/dataartsstudio/umn/en-us_image_0000002234236680.png new file mode 100644 index 000000000..30e30b484 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234236680.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408481.png b/docs/dataartsstudio/umn/en-us_image_0000002234236776.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408481.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236776.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438965.png b/docs/dataartsstudio/umn/en-us_image_0000002234236792.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438965.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236792.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441541.png b/docs/dataartsstudio/umn/en-us_image_0000002234236804.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441541.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236804.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789060.png b/docs/dataartsstudio/umn/en-us_image_0000002234236836.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789060.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236836.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845718.png b/docs/dataartsstudio/umn/en-us_image_0000002234236924.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845718.png rename to docs/dataartsstudio/umn/en-us_image_0000002234236924.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406377.png b/docs/dataartsstudio/umn/en-us_image_0000002234237032.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406377.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237032.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438701.png b/docs/dataartsstudio/umn/en-us_image_0000002234237092.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438701.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237092.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791664.png b/docs/dataartsstudio/umn/en-us_image_0000002234237164.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791664.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237164.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441025.png b/docs/dataartsstudio/umn/en-us_image_0000002234237212.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441025.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237212.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791596.png b/docs/dataartsstudio/umn/en-us_image_0000002234237268.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791596.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237268.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440373.png b/docs/dataartsstudio/umn/en-us_image_0000002234237300.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440373.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237300.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791584.png b/docs/dataartsstudio/umn/en-us_image_0000002234237324.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791584.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237324.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440421.png b/docs/dataartsstudio/umn/en-us_image_0000002234237340.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440421.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237340.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791580.png b/docs/dataartsstudio/umn/en-us_image_0000002234237348.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791580.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237348.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234237496.png b/docs/dataartsstudio/umn/en-us_image_0000002234237496.png new file mode 100644 index 000000000..6a8c232c2 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234237496.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440409.png b/docs/dataartsstudio/umn/en-us_image_0000002234237504.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440409.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237504.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846826.png b/docs/dataartsstudio/umn/en-us_image_0000002234237516.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846826.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237516.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848626.png b/docs/dataartsstudio/umn/en-us_image_0000002234237528.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848626.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237528.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846334.png b/docs/dataartsstudio/umn/en-us_image_0000002234237616.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846334.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237616.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847706.png b/docs/dataartsstudio/umn/en-us_image_0000002234237728.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847706.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237728.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406665.png b/docs/dataartsstudio/umn/en-us_image_0000002234237740.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406665.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237740.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846954.png b/docs/dataartsstudio/umn/en-us_image_0000002234237788.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846954.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237788.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790132.png b/docs/dataartsstudio/umn/en-us_image_0000002234237800.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790132.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237800.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846998.png b/docs/dataartsstudio/umn/en-us_image_0000002234237808.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846998.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237808.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847086.jpg b/docs/dataartsstudio/umn/en-us_image_0000002234237944.jpg similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847086.jpg rename to docs/dataartsstudio/umn/en-us_image_0000002234237944.jpg diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791016.png b/docs/dataartsstudio/umn/en-us_image_0000002234237972.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791016.png rename to docs/dataartsstudio/umn/en-us_image_0000002234237972.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440181.png b/docs/dataartsstudio/umn/en-us_image_0000002234238072.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440181.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238072.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440433.png b/docs/dataartsstudio/umn/en-us_image_0000002234238200.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440433.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238200.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406281.png b/docs/dataartsstudio/umn/en-us_image_0000002234238204.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406281.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238204.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439385.png b/docs/dataartsstudio/umn/en-us_image_0000002234238260.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439385.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238260.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789584.png b/docs/dataartsstudio/umn/en-us_image_0000002234238264.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789584.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238264.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408217.png b/docs/dataartsstudio/umn/en-us_image_0000002234238280.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408217.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238280.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234238444.png b/docs/dataartsstudio/umn/en-us_image_0000002234238444.png new file mode 100644 index 000000000..905964577 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234238444.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234238460.png b/docs/dataartsstudio/umn/en-us_image_0000002234238460.png new file mode 100644 index 000000000..4f6815339 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234238460.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406933.png b/docs/dataartsstudio/umn/en-us_image_0000002234238624.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406933.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238624.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847054.png b/docs/dataartsstudio/umn/en-us_image_0000002234238636.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847054.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238636.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439965.png b/docs/dataartsstudio/umn/en-us_image_0000002234238656.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439965.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238656.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846742.png b/docs/dataartsstudio/umn/en-us_image_0000002234238748.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846742.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238748.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234238756.png b/docs/dataartsstudio/umn/en-us_image_0000002234238756.png new file mode 100644 index 000000000..b0bf7565a Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234238756.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234238764.png b/docs/dataartsstudio/umn/en-us_image_0000002234238764.png new file mode 100644 index 000000000..8f1e7dd22 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234238764.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789804.png b/docs/dataartsstudio/umn/en-us_image_0000002234238812.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789804.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238812.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846650.png b/docs/dataartsstudio/umn/en-us_image_0000002234238820.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846650.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238820.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790992.png b/docs/dataartsstudio/umn/en-us_image_0000002234238852.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790992.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238852.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790472.png b/docs/dataartsstudio/umn/en-us_image_0000002234238916.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790472.png rename to docs/dataartsstudio/umn/en-us_image_0000002234238916.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234238980.png b/docs/dataartsstudio/umn/en-us_image_0000002234238980.png new file mode 100644 index 000000000..3b8969fdc Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234238980.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305404981.png b/docs/dataartsstudio/umn/en-us_image_0000002234239000.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305404981.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239000.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305404553.png b/docs/dataartsstudio/umn/en-us_image_0000002234239032.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305404553.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239032.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407825.png b/docs/dataartsstudio/umn/en-us_image_0000002234239624.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407825.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239624.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846314.png b/docs/dataartsstudio/umn/en-us_image_0000002234239680.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846314.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239680.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406641.png b/docs/dataartsstudio/umn/en-us_image_0000002234239792.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406641.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239792.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846746.png b/docs/dataartsstudio/umn/en-us_image_0000002234239808.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846746.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239808.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406625.png b/docs/dataartsstudio/umn/en-us_image_0000002234239816.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406625.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239816.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847038.png b/docs/dataartsstudio/umn/en-us_image_0000002234239844.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847038.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239844.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439957.png b/docs/dataartsstudio/umn/en-us_image_0000002234239928.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439957.png rename to docs/dataartsstudio/umn/en-us_image_0000002234239928.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405869.png b/docs/dataartsstudio/umn/en-us_image_0000002234240048.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405869.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240048.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791656.png b/docs/dataartsstudio/umn/en-us_image_0000002234240156.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791656.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240156.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790616.png b/docs/dataartsstudio/umn/en-us_image_0000002234240172.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790616.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240172.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234240288.png b/docs/dataartsstudio/umn/en-us_image_0000002234240288.png new file mode 100644 index 000000000..4436578f7 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234240288.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440905.png b/docs/dataartsstudio/umn/en-us_image_0000002234240444.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440905.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240444.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234240460.png b/docs/dataartsstudio/umn/en-us_image_0000002234240460.png new file mode 100644 index 000000000..08653227e Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234240460.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407829.png b/docs/dataartsstudio/umn/en-us_image_0000002234240472.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407829.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240472.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791092.png b/docs/dataartsstudio/umn/en-us_image_0000002234240480.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791092.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240480.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234240552.png b/docs/dataartsstudio/umn/en-us_image_0000002234240552.png new file mode 100644 index 000000000..45e6357b7 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234240552.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439549.png b/docs/dataartsstudio/umn/en-us_image_0000002234240612.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439549.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240612.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846606.png b/docs/dataartsstudio/umn/en-us_image_0000002234240616.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846606.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240616.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846618.png b/docs/dataartsstudio/umn/en-us_image_0000002234240632.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846618.png rename to docs/dataartsstudio/umn/en-us_image_0000002234240632.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405617.jpg b/docs/dataartsstudio/umn/en-us_image_0000002234240788.jpg similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405617.jpg rename to docs/dataartsstudio/umn/en-us_image_0000002234240788.jpg diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847502.png b/docs/dataartsstudio/umn/en-us_image_0000002234241004.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847502.png rename to docs/dataartsstudio/umn/en-us_image_0000002234241004.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790636.png b/docs/dataartsstudio/umn/en-us_image_0000002234241012.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790636.png rename to docs/dataartsstudio/umn/en-us_image_0000002234241012.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407389.png b/docs/dataartsstudio/umn/en-us_image_0000002234241072.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407389.png rename to docs/dataartsstudio/umn/en-us_image_0000002234241072.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234241140.png b/docs/dataartsstudio/umn/en-us_image_0000002234241140.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234241140.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789756.png b/docs/dataartsstudio/umn/en-us_image_0000002234241420.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789756.png rename to docs/dataartsstudio/umn/en-us_image_0000002234241420.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440869.png b/docs/dataartsstudio/umn/en-us_image_0000002234241796.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440869.png rename to docs/dataartsstudio/umn/en-us_image_0000002234241796.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791064.png b/docs/dataartsstudio/umn/en-us_image_0000002234241808.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791064.png rename to docs/dataartsstudio/umn/en-us_image_0000002234241808.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407333.png b/docs/dataartsstudio/umn/en-us_image_0000002234242340.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407333.png rename to docs/dataartsstudio/umn/en-us_image_0000002234242340.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847586.png b/docs/dataartsstudio/umn/en-us_image_0000002234242960.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847586.png rename to docs/dataartsstudio/umn/en-us_image_0000002234242960.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441089.png b/docs/dataartsstudio/umn/en-us_image_0000002234243352.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441089.png rename to docs/dataartsstudio/umn/en-us_image_0000002234243352.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791280.png b/docs/dataartsstudio/umn/en-us_image_0000002234243360.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791280.png rename to docs/dataartsstudio/umn/en-us_image_0000002234243360.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848146.png b/docs/dataartsstudio/umn/en-us_image_0000002234244332.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848146.png rename to docs/dataartsstudio/umn/en-us_image_0000002234244332.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440333.png b/docs/dataartsstudio/umn/en-us_image_0000002234244360.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440333.png rename to docs/dataartsstudio/umn/en-us_image_0000002234244360.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002234244428.png b/docs/dataartsstudio/umn/en-us_image_0000002234244428.png new file mode 100644 index 000000000..d0ef43f8c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002234244428.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791748.png b/docs/dataartsstudio/umn/en-us_image_0000002234244496.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791748.png rename to docs/dataartsstudio/umn/en-us_image_0000002234244496.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440621.png b/docs/dataartsstudio/umn/en-us_image_0000002234244824.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440621.png rename to docs/dataartsstudio/umn/en-us_image_0000002234244824.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789856.png b/docs/dataartsstudio/umn/en-us_image_0000002234244964.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789856.png rename to docs/dataartsstudio/umn/en-us_image_0000002234244964.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440657.png b/docs/dataartsstudio/umn/en-us_image_0000002234245040.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440657.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245040.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440665.png b/docs/dataartsstudio/umn/en-us_image_0000002234245052.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440665.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245052.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791160.jpg b/docs/dataartsstudio/umn/en-us_image_0000002234245436.jpg similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791160.jpg rename to docs/dataartsstudio/umn/en-us_image_0000002234245436.jpg diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846766.png b/docs/dataartsstudio/umn/en-us_image_0000002234245540.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846766.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245540.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791644.png b/docs/dataartsstudio/umn/en-us_image_0000002234245572.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791644.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245572.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408061.png b/docs/dataartsstudio/umn/en-us_image_0000002234245684.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408061.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245684.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440949.png b/docs/dataartsstudio/umn/en-us_image_0000002234245708.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440949.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245708.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848022.png b/docs/dataartsstudio/umn/en-us_image_0000002234245752.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848022.png rename to docs/dataartsstudio/umn/en-us_image_0000002234245752.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002236648476.png b/docs/dataartsstudio/umn/en-us_image_0000002236648476.png new file mode 100644 index 000000000..172f64c87 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002236648476.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002236652800.png b/docs/dataartsstudio/umn/en-us_image_0000002236652800.png new file mode 100644 index 000000000..5142e68a0 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002236652800.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002236808296.png b/docs/dataartsstudio/umn/en-us_image_0000002236808296.png new file mode 100644 index 000000000..172f64c87 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002236808296.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846470.png b/docs/dataartsstudio/umn/en-us_image_0000002269114701.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846470.png rename to docs/dataartsstudio/umn/en-us_image_0000002269114701.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269114769.png b/docs/dataartsstudio/umn/en-us_image_0000002269114769.png new file mode 100644 index 000000000..a03054998 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269114769.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790172.png b/docs/dataartsstudio/umn/en-us_image_0000002269114785.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790172.png rename to docs/dataartsstudio/umn/en-us_image_0000002269114785.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269114801.png b/docs/dataartsstudio/umn/en-us_image_0000002269114801.png new file mode 100644 index 000000000..4dd37ca7a Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269114801.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848170.png b/docs/dataartsstudio/umn/en-us_image_0000002269114877.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848170.png rename to docs/dataartsstudio/umn/en-us_image_0000002269114877.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848166.png b/docs/dataartsstudio/umn/en-us_image_0000002269114889.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848166.png rename to docs/dataartsstudio/umn/en-us_image_0000002269114889.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269114909.png b/docs/dataartsstudio/umn/en-us_image_0000002269114909.png new file mode 100644 index 000000000..751063166 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269114909.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407393.png b/docs/dataartsstudio/umn/en-us_image_0000002269114989.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407393.png rename to docs/dataartsstudio/umn/en-us_image_0000002269114989.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269115061.png b/docs/dataartsstudio/umn/en-us_image_0000002269115061.png new file mode 100644 index 000000000..879c51d61 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269115061.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847842.png b/docs/dataartsstudio/umn/en-us_image_0000002269115113.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847842.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115113.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407225.png b/docs/dataartsstudio/umn/en-us_image_0000002269115137.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407225.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115137.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847350.png b/docs/dataartsstudio/umn/en-us_image_0000002269115141.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847350.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115141.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790316.png b/docs/dataartsstudio/umn/en-us_image_0000002269115341.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790316.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115341.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791496.png b/docs/dataartsstudio/umn/en-us_image_0000002269115445.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791496.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115445.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438645.png b/docs/dataartsstudio/umn/en-us_image_0000002269115493.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438645.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115493.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440849.png b/docs/dataartsstudio/umn/en-us_image_0000002269115501.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440849.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115501.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791048.png b/docs/dataartsstudio/umn/en-us_image_0000002269115513.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791048.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115513.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405497.png b/docs/dataartsstudio/umn/en-us_image_0000002269115561.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405497.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115561.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847222.png b/docs/dataartsstudio/umn/en-us_image_0000002269115569.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847222.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115569.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847218.png b/docs/dataartsstudio/umn/en-us_image_0000002269115597.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847218.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115597.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269115609.png b/docs/dataartsstudio/umn/en-us_image_0000002269115609.png new file mode 100644 index 000000000..a020ce4bd Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269115609.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440177.png b/docs/dataartsstudio/umn/en-us_image_0000002269115617.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440177.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115617.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407005.png b/docs/dataartsstudio/umn/en-us_image_0000002269115641.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407005.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115641.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270845678.png b/docs/dataartsstudio/umn/en-us_image_0000002269115709.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270845678.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115709.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438625.png b/docs/dataartsstudio/umn/en-us_image_0000002269115725.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438625.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115725.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439869.png b/docs/dataartsstudio/umn/en-us_image_0000002269115869.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439869.png rename to docs/dataartsstudio/umn/en-us_image_0000002269115869.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407193.png b/docs/dataartsstudio/umn/en-us_image_0000002269116013.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407193.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116013.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791728.png b/docs/dataartsstudio/umn/en-us_image_0000002269116113.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791728.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116113.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846026.png b/docs/dataartsstudio/umn/en-us_image_0000002269116145.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846026.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116145.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791744.png b/docs/dataartsstudio/umn/en-us_image_0000002269116149.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791744.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116149.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441537.png b/docs/dataartsstudio/umn/en-us_image_0000002269116161.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441537.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116161.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791740.png b/docs/dataartsstudio/umn/en-us_image_0000002269116181.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791740.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116181.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791724.png b/docs/dataartsstudio/umn/en-us_image_0000002269116221.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791724.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116221.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438749.png b/docs/dataartsstudio/umn/en-us_image_0000002269116277.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438749.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116277.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847890.png b/docs/dataartsstudio/umn/en-us_image_0000002269116369.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847890.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116369.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269116385.png b/docs/dataartsstudio/umn/en-us_image_0000002269116385.png new file mode 100644 index 000000000..9149e09af Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269116385.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406329.png b/docs/dataartsstudio/umn/en-us_image_0000002269116389.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406329.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116389.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438925.png b/docs/dataartsstudio/umn/en-us_image_0000002269116429.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438925.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116429.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305437605.png b/docs/dataartsstudio/umn/en-us_image_0000002269116513.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305437605.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116513.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791660.png b/docs/dataartsstudio/umn/en-us_image_0000002269116521.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791660.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116521.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847494.png b/docs/dataartsstudio/umn/en-us_image_0000002269116529.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847494.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116529.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848090.png b/docs/dataartsstudio/umn/en-us_image_0000002269116577.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848090.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116577.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791240.png b/docs/dataartsstudio/umn/en-us_image_0000002269116581.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791240.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116581.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791220.png b/docs/dataartsstudio/umn/en-us_image_0000002269116601.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791220.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116601.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441381.png b/docs/dataartsstudio/umn/en-us_image_0000002269116637.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441381.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116637.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441389.png b/docs/dataartsstudio/umn/en-us_image_0000002269116645.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441389.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116645.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790928.png b/docs/dataartsstudio/umn/en-us_image_0000002269116789.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790928.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116789.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440645.png b/docs/dataartsstudio/umn/en-us_image_0000002269116797.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440645.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116797.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846838.png b/docs/dataartsstudio/umn/en-us_image_0000002269116869.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846838.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116869.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791764.png b/docs/dataartsstudio/umn/en-us_image_0000002269116885.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791764.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116885.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441553.png b/docs/dataartsstudio/umn/en-us_image_0000002269116909.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441553.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116909.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789476.png b/docs/dataartsstudio/umn/en-us_image_0000002269116973.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789476.png rename to docs/dataartsstudio/umn/en-us_image_0000002269116973.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847690.png b/docs/dataartsstudio/umn/en-us_image_0000002269117093.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847690.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117093.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847362.png b/docs/dataartsstudio/umn/en-us_image_0000002269117181.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847362.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117181.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847358.png b/docs/dataartsstudio/umn/en-us_image_0000002269117185.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847358.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117185.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790240.jpg b/docs/dataartsstudio/umn/en-us_image_0000002269117305.jpg similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790240.jpg rename to docs/dataartsstudio/umn/en-us_image_0000002269117305.jpg diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407377.png b/docs/dataartsstudio/umn/en-us_image_0000002269117313.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407377.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117313.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847214.png b/docs/dataartsstudio/umn/en-us_image_0000002269117457.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847214.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117457.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440189.png b/docs/dataartsstudio/umn/en-us_image_0000002269117469.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440189.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117469.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847386.png b/docs/dataartsstudio/umn/en-us_image_0000002269117481.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847386.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117481.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441449.png b/docs/dataartsstudio/umn/en-us_image_0000002269117553.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441449.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117553.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441401.png b/docs/dataartsstudio/umn/en-us_image_0000002269117557.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441401.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117557.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406705.png b/docs/dataartsstudio/umn/en-us_image_0000002269117565.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406705.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117565.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790624.png b/docs/dataartsstudio/umn/en-us_image_0000002269117569.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790624.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117569.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440417.png b/docs/dataartsstudio/umn/en-us_image_0000002269117573.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440417.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117573.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441245.png b/docs/dataartsstudio/umn/en-us_image_0000002269117649.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441245.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117649.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408213.png b/docs/dataartsstudio/umn/en-us_image_0000002269117665.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408213.png rename to docs/dataartsstudio/umn/en-us_image_0000002269117665.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406657.png b/docs/dataartsstudio/umn/en-us_image_0000002269118053.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406657.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118053.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846782.png b/docs/dataartsstudio/umn/en-us_image_0000002269118061.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846782.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118061.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406617.png b/docs/dataartsstudio/umn/en-us_image_0000002269118105.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406617.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118105.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269118113.png b/docs/dataartsstudio/umn/en-us_image_0000002269118113.png new file mode 100644 index 000000000..901446ec8 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269118113.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846710.png b/docs/dataartsstudio/umn/en-us_image_0000002269118121.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846710.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118121.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790456.png b/docs/dataartsstudio/umn/en-us_image_0000002269118145.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790456.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118145.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846670.png b/docs/dataartsstudio/umn/en-us_image_0000002269118173.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846670.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118173.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791288.png b/docs/dataartsstudio/umn/en-us_image_0000002269118185.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791288.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118185.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440801.png b/docs/dataartsstudio/umn/en-us_image_0000002269118193.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440801.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118193.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407721.png b/docs/dataartsstudio/umn/en-us_image_0000002269118201.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407721.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118201.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791308.png b/docs/dataartsstudio/umn/en-us_image_0000002269118281.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791308.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118281.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407285.png b/docs/dataartsstudio/umn/en-us_image_0000002269118469.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407285.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118469.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269118525.png b/docs/dataartsstudio/umn/en-us_image_0000002269118525.png new file mode 100644 index 000000000..e8fa01c41 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269118525.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269118533.png b/docs/dataartsstudio/umn/en-us_image_0000002269118533.png new file mode 100644 index 000000000..0e1b34c67 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269118533.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847198.png b/docs/dataartsstudio/umn/en-us_image_0000002269118725.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847198.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118725.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439325.png b/docs/dataartsstudio/umn/en-us_image_0000002269118733.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439325.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118733.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846374.png b/docs/dataartsstudio/umn/en-us_image_0000002269118737.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846374.png rename to docs/dataartsstudio/umn/en-us_image_0000002269118737.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269118889.png b/docs/dataartsstudio/umn/en-us_image_0000002269118889.png new file mode 100644 index 000000000..37fb04656 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269118889.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847938.png b/docs/dataartsstudio/umn/en-us_image_0000002269119041.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847938.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119041.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406621.png b/docs/dataartsstudio/umn/en-us_image_0000002269119133.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406621.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119133.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406629.png b/docs/dataartsstudio/umn/en-us_image_0000002269119161.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406629.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119161.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119177.png b/docs/dataartsstudio/umn/en-us_image_0000002269119177.png new file mode 100644 index 000000000..c9bba553d Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119177.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407009.png b/docs/dataartsstudio/umn/en-us_image_0000002269119309.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407009.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119309.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788384.png b/docs/dataartsstudio/umn/en-us_image_0000002269119389.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788384.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119389.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788176.png b/docs/dataartsstudio/umn/en-us_image_0000002269119541.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788176.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119541.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789976.png b/docs/dataartsstudio/umn/en-us_image_0000002269119545.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789976.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119545.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119629.png b/docs/dataartsstudio/umn/en-us_image_0000002269119629.png new file mode 100644 index 000000000..3664b6db9 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119629.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119645.png b/docs/dataartsstudio/umn/en-us_image_0000002269119645.png new file mode 100644 index 000000000..08f1f0774 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119645.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119681.png b/docs/dataartsstudio/umn/en-us_image_0000002269119681.png new file mode 100644 index 000000000..7f6e27c73 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119681.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119697.png b/docs/dataartsstudio/umn/en-us_image_0000002269119697.png new file mode 100644 index 000000000..3e45a046c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119697.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406909.png b/docs/dataartsstudio/umn/en-us_image_0000002269119761.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406909.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119761.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440901.png b/docs/dataartsstudio/umn/en-us_image_0000002269119817.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440901.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119817.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791100.png b/docs/dataartsstudio/umn/en-us_image_0000002269119825.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791100.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119825.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789500.png b/docs/dataartsstudio/umn/en-us_image_0000002269119869.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789500.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119869.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119953.png b/docs/dataartsstudio/umn/en-us_image_0000002269119953.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119953.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439561.png b/docs/dataartsstudio/umn/en-us_image_0000002269119961.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439561.png rename to docs/dataartsstudio/umn/en-us_image_0000002269119961.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269119985.png b/docs/dataartsstudio/umn/en-us_image_0000002269119985.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269119985.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441189.png b/docs/dataartsstudio/umn/en-us_image_0000002269120029.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441189.png rename to docs/dataartsstudio/umn/en-us_image_0000002269120029.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848246.png b/docs/dataartsstudio/umn/en-us_image_0000002269120033.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848246.png rename to docs/dataartsstudio/umn/en-us_image_0000002269120033.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440449.png b/docs/dataartsstudio/umn/en-us_image_0000002269120405.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440449.png rename to docs/dataartsstudio/umn/en-us_image_0000002269120405.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269120509.png b/docs/dataartsstudio/umn/en-us_image_0000002269120509.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269120509.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269120589.png b/docs/dataartsstudio/umn/en-us_image_0000002269120589.png new file mode 100644 index 000000000..d26397483 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269120589.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269120645.png b/docs/dataartsstudio/umn/en-us_image_0000002269120645.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269120645.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269120701.png b/docs/dataartsstudio/umn/en-us_image_0000002269120701.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269120701.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791148.png b/docs/dataartsstudio/umn/en-us_image_0000002269120705.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791148.png rename to docs/dataartsstudio/umn/en-us_image_0000002269120705.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789432.png b/docs/dataartsstudio/umn/en-us_image_0000002269120765.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789432.png rename to docs/dataartsstudio/umn/en-us_image_0000002269120765.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846978.png b/docs/dataartsstudio/umn/en-us_image_0000002269121457.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846978.png rename to docs/dataartsstudio/umn/en-us_image_0000002269121457.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269121561.png b/docs/dataartsstudio/umn/en-us_image_0000002269121561.png new file mode 100644 index 000000000..e316c01c9 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269121561.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440377.png b/docs/dataartsstudio/umn/en-us_image_0000002269121685.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440377.png rename to docs/dataartsstudio/umn/en-us_image_0000002269121685.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847462.png b/docs/dataartsstudio/umn/en-us_image_0000002269121693.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847462.png rename to docs/dataartsstudio/umn/en-us_image_0000002269121693.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847446.png b/docs/dataartsstudio/umn/en-us_image_0000002269121789.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847446.png rename to docs/dataartsstudio/umn/en-us_image_0000002269121789.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269121941.png b/docs/dataartsstudio/umn/en-us_image_0000002269121941.png new file mode 100644 index 000000000..fd17ed672 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269121941.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269121969.png b/docs/dataartsstudio/umn/en-us_image_0000002269121969.png new file mode 100644 index 000000000..02786b931 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269121969.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846450.png b/docs/dataartsstudio/umn/en-us_image_0000002269122377.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846450.png rename to docs/dataartsstudio/umn/en-us_image_0000002269122377.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441085.png b/docs/dataartsstudio/umn/en-us_image_0000002269123729.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441085.png rename to docs/dataartsstudio/umn/en-us_image_0000002269123729.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440337.png b/docs/dataartsstudio/umn/en-us_image_0000002269123741.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440337.png rename to docs/dataartsstudio/umn/en-us_image_0000002269123741.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406805.png b/docs/dataartsstudio/umn/en-us_image_0000002269124413.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406805.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124413.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441069.png b/docs/dataartsstudio/umn/en-us_image_0000002269124549.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441069.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124549.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848126.png b/docs/dataartsstudio/umn/en-us_image_0000002269124561.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848126.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124561.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407901.png b/docs/dataartsstudio/umn/en-us_image_0000002269124641.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407901.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124641.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789604.png b/docs/dataartsstudio/umn/en-us_image_0000002269124649.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789604.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124649.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440889.png b/docs/dataartsstudio/umn/en-us_image_0000002269124773.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440889.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124773.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407289.png b/docs/dataartsstudio/umn/en-us_image_0000002269124789.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407289.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124789.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440029.png b/docs/dataartsstudio/umn/en-us_image_0000002269124797.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440029.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124797.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269124893.png b/docs/dataartsstudio/umn/en-us_image_0000002269124893.png new file mode 100644 index 000000000..ed5555035 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269124893.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407049.png b/docs/dataartsstudio/umn/en-us_image_0000002269124905.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407049.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124905.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269124977.png b/docs/dataartsstudio/umn/en-us_image_0000002269124977.png new file mode 100644 index 000000000..4910efa54 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269124977.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790400.png b/docs/dataartsstudio/umn/en-us_image_0000002269124989.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790400.png rename to docs/dataartsstudio/umn/en-us_image_0000002269124989.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847814.png b/docs/dataartsstudio/umn/en-us_image_0000002269125049.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847814.png rename to docs/dataartsstudio/umn/en-us_image_0000002269125049.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407893.png b/docs/dataartsstudio/umn/en-us_image_0000002269125109.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407893.png rename to docs/dataartsstudio/umn/en-us_image_0000002269125109.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270844914.png b/docs/dataartsstudio/umn/en-us_image_0000002269188109.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270844914.png rename to docs/dataartsstudio/umn/en-us_image_0000002269188109.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789428.png b/docs/dataartsstudio/umn/en-us_image_0000002269194761.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789428.png rename to docs/dataartsstudio/umn/en-us_image_0000002269194761.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848222.png b/docs/dataartsstudio/umn/en-us_image_0000002269194845.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848222.png rename to docs/dataartsstudio/umn/en-us_image_0000002269194845.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439953.png b/docs/dataartsstudio/umn/en-us_image_0000002269194989.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439953.png rename to docs/dataartsstudio/umn/en-us_image_0000002269194989.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269195025.png b/docs/dataartsstudio/umn/en-us_image_0000002269195025.png new file mode 100644 index 000000000..a5a6b4817 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269195025.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847458.png b/docs/dataartsstudio/umn/en-us_image_0000002269195049.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847458.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195049.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269195065.png b/docs/dataartsstudio/umn/en-us_image_0000002269195065.png new file mode 100644 index 000000000..457f17d0c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269195065.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790996.png b/docs/dataartsstudio/umn/en-us_image_0000002269195201.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790996.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195201.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790476.png b/docs/dataartsstudio/umn/en-us_image_0000002269195221.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790476.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195221.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847866.png b/docs/dataartsstudio/umn/en-us_image_0000002269195241.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847866.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195241.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269195369.png b/docs/dataartsstudio/umn/en-us_image_0000002269195369.png new file mode 100644 index 000000000..27012f002 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269195369.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269195381.png b/docs/dataartsstudio/umn/en-us_image_0000002269195381.png new file mode 100644 index 000000000..7c87efdad Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269195381.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790320.png b/docs/dataartsstudio/umn/en-us_image_0000002269195385.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790320.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195385.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405569.png b/docs/dataartsstudio/umn/en-us_image_0000002269195577.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405569.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195577.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438637.png b/docs/dataartsstudio/umn/en-us_image_0000002269195581.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438637.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195581.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407093.png b/docs/dataartsstudio/umn/en-us_image_0000002269195641.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407093.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195641.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405713.png b/docs/dataartsstudio/umn/en-us_image_0000002269195661.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305405713.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195661.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847230.png b/docs/dataartsstudio/umn/en-us_image_0000002269195669.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847230.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195669.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269195693.png b/docs/dataartsstudio/umn/en-us_image_0000002269195693.png new file mode 100644 index 000000000..88ebb8747 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269195693.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270788936.png b/docs/dataartsstudio/umn/en-us_image_0000002269195801.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270788936.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195801.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438737.png b/docs/dataartsstudio/umn/en-us_image_0000002269195813.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438737.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195813.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440313.png b/docs/dataartsstudio/umn/en-us_image_0000002269195869.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440313.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195869.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438717.png b/docs/dataartsstudio/umn/en-us_image_0000002269195881.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438717.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195881.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438813.png b/docs/dataartsstudio/umn/en-us_image_0000002269195897.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438813.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195897.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439857.png b/docs/dataartsstudio/umn/en-us_image_0000002269195969.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439857.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195969.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439529.png b/docs/dataartsstudio/umn/en-us_image_0000002269195981.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439529.png rename to docs/dataartsstudio/umn/en-us_image_0000002269195981.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438569.png b/docs/dataartsstudio/umn/en-us_image_0000002269196149.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438569.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196149.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438973.png b/docs/dataartsstudio/umn/en-us_image_0000002269196181.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438973.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196181.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408477.png b/docs/dataartsstudio/umn/en-us_image_0000002269196209.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408477.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196209.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791732.png b/docs/dataartsstudio/umn/en-us_image_0000002269196257.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791732.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196257.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789124.png b/docs/dataartsstudio/umn/en-us_image_0000002269196341.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789124.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196341.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789116.png b/docs/dataartsstudio/umn/en-us_image_0000002269196349.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789116.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196349.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846494.png b/docs/dataartsstudio/umn/en-us_image_0000002269196453.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846494.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196453.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441461.png b/docs/dataartsstudio/umn/en-us_image_0000002269196601.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441461.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196601.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791236.png b/docs/dataartsstudio/umn/en-us_image_0000002269196641.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791236.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196641.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441529.png b/docs/dataartsstudio/umn/en-us_image_0000002269196709.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441529.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196709.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408241.png b/docs/dataartsstudio/umn/en-us_image_0000002269196733.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408241.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196733.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408325.png b/docs/dataartsstudio/umn/en-us_image_0000002269196741.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408325.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196741.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791576.png b/docs/dataartsstudio/umn/en-us_image_0000002269196749.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791576.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196749.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408333.png b/docs/dataartsstudio/umn/en-us_image_0000002269196757.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408333.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196757.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791588.png b/docs/dataartsstudio/umn/en-us_image_0000002269196765.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791588.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196765.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441393.png b/docs/dataartsstudio/umn/en-us_image_0000002269196781.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441393.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196781.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846430.png b/docs/dataartsstudio/umn/en-us_image_0000002269196933.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846430.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196933.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441465.png b/docs/dataartsstudio/umn/en-us_image_0000002269196941.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441465.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196941.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791752.png b/docs/dataartsstudio/umn/en-us_image_0000002269196981.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791752.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196981.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441565.png b/docs/dataartsstudio/umn/en-us_image_0000002269196997.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441565.png rename to docs/dataartsstudio/umn/en-us_image_0000002269196997.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791060.png b/docs/dataartsstudio/umn/en-us_image_0000002269197053.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791060.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197053.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440237.png b/docs/dataartsstudio/umn/en-us_image_0000002269197141.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440237.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197141.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847702.png b/docs/dataartsstudio/umn/en-us_image_0000002269197209.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847702.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197209.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846958.png b/docs/dataartsstudio/umn/en-us_image_0000002269197229.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846958.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197229.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846962.png b/docs/dataartsstudio/umn/en-us_image_0000002269197233.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846962.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197233.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790136.png b/docs/dataartsstudio/umn/en-us_image_0000002269197245.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790136.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197245.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407245.png b/docs/dataartsstudio/umn/en-us_image_0000002269197257.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407245.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197257.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440089.png b/docs/dataartsstudio/umn/en-us_image_0000002269197449.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440089.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197449.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439397.png b/docs/dataartsstudio/umn/en-us_image_0000002269197469.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439397.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197469.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847398.png b/docs/dataartsstudio/umn/en-us_image_0000002269197485.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847398.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197485.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847226.png b/docs/dataartsstudio/umn/en-us_image_0000002269197513.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847226.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197513.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848502.png b/docs/dataartsstudio/umn/en-us_image_0000002269197897.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270848502.png rename to docs/dataartsstudio/umn/en-us_image_0000002269197897.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269197901.png b/docs/dataartsstudio/umn/en-us_image_0000002269197901.png new file mode 100644 index 000000000..7d056a89c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269197901.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406925.png b/docs/dataartsstudio/umn/en-us_image_0000002269198065.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406925.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198065.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406921.png b/docs/dataartsstudio/umn/en-us_image_0000002269198077.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406921.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198077.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406929.png b/docs/dataartsstudio/umn/en-us_image_0000002269198105.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406929.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198105.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789488.png b/docs/dataartsstudio/umn/en-us_image_0000002269198113.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789488.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198113.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269198189.png b/docs/dataartsstudio/umn/en-us_image_0000002269198189.png new file mode 100644 index 000000000..f7c9ee368 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269198189.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846706.png b/docs/dataartsstudio/umn/en-us_image_0000002269198197.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846706.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198197.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789888.png b/docs/dataartsstudio/umn/en-us_image_0000002269198213.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789888.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198213.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789664.png b/docs/dataartsstudio/umn/en-us_image_0000002269198221.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789664.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198221.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269198253.png b/docs/dataartsstudio/umn/en-us_image_0000002269198253.png new file mode 100644 index 000000000..6e392267b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269198253.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406541.png b/docs/dataartsstudio/umn/en-us_image_0000002269198261.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406541.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198261.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439593.png b/docs/dataartsstudio/umn/en-us_image_0000002269198269.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439593.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198269.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408025.png b/docs/dataartsstudio/umn/en-us_image_0000002269198277.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408025.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198277.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790960.png b/docs/dataartsstudio/umn/en-us_image_0000002269198293.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790960.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198293.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847346.png b/docs/dataartsstudio/umn/en-us_image_0000002269198369.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270847346.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198369.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438069.png b/docs/dataartsstudio/umn/en-us_image_0000002269198449.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305438069.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198449.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846402.png b/docs/dataartsstudio/umn/en-us_image_0000002269198765.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846402.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198765.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406273.png b/docs/dataartsstudio/umn/en-us_image_0000002269198773.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406273.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198773.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439377.png b/docs/dataartsstudio/umn/en-us_image_0000002269198821.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439377.png rename to docs/dataartsstudio/umn/en-us_image_0000002269198821.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439949.png b/docs/dataartsstudio/umn/en-us_image_0000002269199053.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439949.png rename to docs/dataartsstudio/umn/en-us_image_0000002269199053.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269199241.png b/docs/dataartsstudio/umn/en-us_image_0000002269199241.png new file mode 100644 index 000000000..709be938d Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269199241.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269199249.png b/docs/dataartsstudio/umn/en-us_image_0000002269199249.png new file mode 100644 index 000000000..364292f4c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269199249.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440881.png b/docs/dataartsstudio/umn/en-us_image_0000002269199617.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440881.png rename to docs/dataartsstudio/umn/en-us_image_0000002269199617.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790304.png b/docs/dataartsstudio/umn/en-us_image_0000002269199621.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790304.png rename to docs/dataartsstudio/umn/en-us_image_0000002269199621.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269199961.png b/docs/dataartsstudio/umn/en-us_image_0000002269199961.png new file mode 100644 index 000000000..6cac0a2ab Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269199961.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789752.png b/docs/dataartsstudio/umn/en-us_image_0000002269199973.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789752.png rename to docs/dataartsstudio/umn/en-us_image_0000002269199973.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269199985.png b/docs/dataartsstudio/umn/en-us_image_0000002269199985.png new file mode 100644 index 000000000..45e6357b7 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269199985.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789744.png b/docs/dataartsstudio/umn/en-us_image_0000002269200033.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270789744.png rename to docs/dataartsstudio/umn/en-us_image_0000002269200033.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269200177.png b/docs/dataartsstudio/umn/en-us_image_0000002269200177.png new file mode 100644 index 000000000..81b834fe5 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269200177.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440725.png b/docs/dataartsstudio/umn/en-us_image_0000002269200193.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440725.png rename to docs/dataartsstudio/umn/en-us_image_0000002269200193.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791600.jpg b/docs/dataartsstudio/umn/en-us_image_0000002269200297.jpg similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791600.jpg rename to docs/dataartsstudio/umn/en-us_image_0000002269200297.jpg diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269200561.png b/docs/dataartsstudio/umn/en-us_image_0000002269200561.png new file mode 100644 index 000000000..ae1610b1b Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269200561.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441473.png b/docs/dataartsstudio/umn/en-us_image_0000002269200857.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441473.png rename to docs/dataartsstudio/umn/en-us_image_0000002269200857.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440865.png b/docs/dataartsstudio/umn/en-us_image_0000002269201253.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440865.png rename to docs/dataartsstudio/umn/en-us_image_0000002269201253.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269201633.png b/docs/dataartsstudio/umn/en-us_image_0000002269201633.png new file mode 100644 index 000000000..46cfe9d92 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269201633.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407325.png b/docs/dataartsstudio/umn/en-us_image_0000002269201777.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407325.png rename to docs/dataartsstudio/umn/en-us_image_0000002269201777.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407317.png b/docs/dataartsstudio/umn/en-us_image_0000002269201833.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407317.png rename to docs/dataartsstudio/umn/en-us_image_0000002269201833.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790600.png b/docs/dataartsstudio/umn/en-us_image_0000002269201849.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790600.png rename to docs/dataartsstudio/umn/en-us_image_0000002269201849.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407329.png b/docs/dataartsstudio/umn/en-us_image_0000002269201865.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407329.png rename to docs/dataartsstudio/umn/en-us_image_0000002269201865.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269202017.png b/docs/dataartsstudio/umn/en-us_image_0000002269202017.png new file mode 100644 index 000000000..610e6c762 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269202017.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441101.png b/docs/dataartsstudio/umn/en-us_image_0000002269202165.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441101.png rename to docs/dataartsstudio/umn/en-us_image_0000002269202165.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791272.png b/docs/dataartsstudio/umn/en-us_image_0000002269202721.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791272.png rename to docs/dataartsstudio/umn/en-us_image_0000002269202721.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441077.png b/docs/dataartsstudio/umn/en-us_image_0000002269202729.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441077.png rename to docs/dataartsstudio/umn/en-us_image_0000002269202729.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408021.png b/docs/dataartsstudio/umn/en-us_image_0000002269202797.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408021.png rename to docs/dataartsstudio/umn/en-us_image_0000002269202797.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791276.png b/docs/dataartsstudio/umn/en-us_image_0000002269202825.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791276.png rename to docs/dataartsstudio/umn/en-us_image_0000002269202825.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441097.png b/docs/dataartsstudio/umn/en-us_image_0000002269203809.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441097.png rename to docs/dataartsstudio/umn/en-us_image_0000002269203809.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441549.png b/docs/dataartsstudio/umn/en-us_image_0000002269203933.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305441549.png rename to docs/dataartsstudio/umn/en-us_image_0000002269203933.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408485.jpg b/docs/dataartsstudio/umn/en-us_image_0000002269203941.jpg similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305408485.jpg rename to docs/dataartsstudio/umn/en-us_image_0000002269203941.jpg diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440613.png b/docs/dataartsstudio/umn/en-us_image_0000002269204277.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440613.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204277.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790820.png b/docs/dataartsstudio/umn/en-us_image_0000002269204289.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270790820.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204289.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407553.png b/docs/dataartsstudio/umn/en-us_image_0000002269204293.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407553.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204293.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407381.png b/docs/dataartsstudio/umn/en-us_image_0000002269204349.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407381.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204349.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440661.png b/docs/dataartsstudio/umn/en-us_image_0000002269204489.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440661.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204489.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439425.png b/docs/dataartsstudio/umn/en-us_image_0000002269204497.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439425.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204497.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439429.png b/docs/dataartsstudio/umn/en-us_image_0000002269204741.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305439429.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204741.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846466.png b/docs/dataartsstudio/umn/en-us_image_0000002269204745.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846466.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204745.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846362.png b/docs/dataartsstudio/umn/en-us_image_0000002269204853.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846362.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204853.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407897.png b/docs/dataartsstudio/umn/en-us_image_0000002269204877.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305407897.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204877.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002269204937.png b/docs/dataartsstudio/umn/en-us_image_0000002269204937.png new file mode 100644 index 000000000..27012f002 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002269204937.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846770.png b/docs/dataartsstudio/umn/en-us_image_0000002269204977.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270846770.png rename to docs/dataartsstudio/umn/en-us_image_0000002269204977.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791652.png b/docs/dataartsstudio/umn/en-us_image_0000002269205005.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002270791652.png rename to docs/dataartsstudio/umn/en-us_image_0000002269205005.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440961.png b/docs/dataartsstudio/umn/en-us_image_0000002269205185.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440961.png rename to docs/dataartsstudio/umn/en-us_image_0000002269205185.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440957.png b/docs/dataartsstudio/umn/en-us_image_0000002269205189.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305440957.png rename to docs/dataartsstudio/umn/en-us_image_0000002269205189.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406813.png b/docs/dataartsstudio/umn/en-us_image_0000002269205393.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002305406813.png rename to docs/dataartsstudio/umn/en-us_image_0000002269205393.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270789880.png b/docs/dataartsstudio/umn/en-us_image_0000002270789880.png deleted file mode 100644 index 1671f494d..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270789880.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790152.png b/docs/dataartsstudio/umn/en-us_image_0000002270790152.png deleted file mode 100644 index aa33c96c3..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790152.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790168.png b/docs/dataartsstudio/umn/en-us_image_0000002270790168.png deleted file mode 100644 index c4202d72b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790168.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790204.png b/docs/dataartsstudio/umn/en-us_image_0000002270790204.png deleted file mode 100644 index 69ae92964..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790204.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790272.png b/docs/dataartsstudio/umn/en-us_image_0000002270790272.png deleted file mode 100644 index f897e8777..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790272.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790352.png b/docs/dataartsstudio/umn/en-us_image_0000002270790352.png deleted file mode 100644 index 34624896e..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790352.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790404.png b/docs/dataartsstudio/umn/en-us_image_0000002270790404.png deleted file mode 100644 index 5c3e06014..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790404.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790548.png b/docs/dataartsstudio/umn/en-us_image_0000002270790548.png deleted file mode 100644 index ff6a010d3..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790548.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790596.png b/docs/dataartsstudio/umn/en-us_image_0000002270790596.png deleted file mode 100644 index 4270ba8c4..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790596.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790648.png b/docs/dataartsstudio/umn/en-us_image_0000002270790648.png deleted file mode 100644 index 0ca533d2e..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790648.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790816.png b/docs/dataartsstudio/umn/en-us_image_0000002270790816.png deleted file mode 100644 index 8228297f9..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790816.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270790856.png b/docs/dataartsstudio/umn/en-us_image_0000002270790856.png deleted file mode 100644 index e880f219b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270790856.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791184.png b/docs/dataartsstudio/umn/en-us_image_0000002270791184.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791184.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791360.png b/docs/dataartsstudio/umn/en-us_image_0000002270791360.png deleted file mode 100644 index 8ffa9e03f..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791360.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791372.png b/docs/dataartsstudio/umn/en-us_image_0000002270791372.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791372.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791376.png b/docs/dataartsstudio/umn/en-us_image_0000002270791376.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791376.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791468.png b/docs/dataartsstudio/umn/en-us_image_0000002270791468.png deleted file mode 100644 index 441eb65fb..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791468.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791636.png b/docs/dataartsstudio/umn/en-us_image_0000002270791636.png deleted file mode 100644 index 548a113cb..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791636.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791648.png b/docs/dataartsstudio/umn/en-us_image_0000002270791648.png deleted file mode 100644 index 5e9d57f6b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791648.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791668.png b/docs/dataartsstudio/umn/en-us_image_0000002270791668.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791668.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270791672.png b/docs/dataartsstudio/umn/en-us_image_0000002270791672.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270791672.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270844674.png b/docs/dataartsstudio/umn/en-us_image_0000002270844674.png deleted file mode 100644 index ef66bf46b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270844674.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270844810.png b/docs/dataartsstudio/umn/en-us_image_0000002270844810.png deleted file mode 100644 index 2d903d4a0..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270844810.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270844902.png b/docs/dataartsstudio/umn/en-us_image_0000002270844902.png deleted file mode 100644 index 323d460df..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270844902.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846434.png b/docs/dataartsstudio/umn/en-us_image_0000002270846434.png deleted file mode 100644 index f60d9ca91..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846434.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846454.png b/docs/dataartsstudio/umn/en-us_image_0000002270846454.png deleted file mode 100644 index 4ee55aa38..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846454.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846462.png b/docs/dataartsstudio/umn/en-us_image_0000002270846462.png deleted file mode 100644 index 4f9ffd97b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846462.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846514.png b/docs/dataartsstudio/umn/en-us_image_0000002270846514.png deleted file mode 100644 index e443f72bd..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846514.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846582.jpg b/docs/dataartsstudio/umn/en-us_image_0000002270846582.jpg deleted file mode 100644 index 0eb8b1b10..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846582.jpg and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846790.png b/docs/dataartsstudio/umn/en-us_image_0000002270846790.png deleted file mode 100644 index a0ee61c64..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846790.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270846830.png b/docs/dataartsstudio/umn/en-us_image_0000002270846830.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270846830.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847046.png b/docs/dataartsstudio/umn/en-us_image_0000002270847046.png deleted file mode 100644 index 2eaa652e8..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847046.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847066.png b/docs/dataartsstudio/umn/en-us_image_0000002270847066.png deleted file mode 100644 index 5baddd7e3..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847066.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847106.png b/docs/dataartsstudio/umn/en-us_image_0000002270847106.png deleted file mode 100644 index a620b99af..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847106.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847126.png b/docs/dataartsstudio/umn/en-us_image_0000002270847126.png deleted file mode 100644 index b9537e4f6..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847126.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847146.png b/docs/dataartsstudio/umn/en-us_image_0000002270847146.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847146.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847322.png b/docs/dataartsstudio/umn/en-us_image_0000002270847322.png deleted file mode 100644 index a0ee61c64..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847322.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847470.png b/docs/dataartsstudio/umn/en-us_image_0000002270847470.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847470.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270847942.png b/docs/dataartsstudio/umn/en-us_image_0000002270847942.png deleted file mode 100644 index fc826b336..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270847942.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848010.png b/docs/dataartsstudio/umn/en-us_image_0000002270848010.png deleted file mode 100644 index 08adaa17d..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270848010.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848226.png b/docs/dataartsstudio/umn/en-us_image_0000002270848226.png deleted file mode 100644 index 5ca650c70..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270848226.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848266.png b/docs/dataartsstudio/umn/en-us_image_0000002270848266.png deleted file mode 100644 index 0eaed8783..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270848266.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848338.png b/docs/dataartsstudio/umn/en-us_image_0000002270848338.png deleted file mode 100644 index 58b8d7626..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270848338.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270848498.png b/docs/dataartsstudio/umn/en-us_image_0000002270848498.png deleted file mode 100644 index 7d0dc3e72..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270848498.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270921874.png b/docs/dataartsstudio/umn/en-us_image_0000002270921874.png deleted file mode 100644 index 8c1f583ae..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270921874.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002270956052.png b/docs/dataartsstudio/umn/en-us_image_0000002270956052.png deleted file mode 100644 index 838d5cebc..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002270956052.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271064250.png b/docs/dataartsstudio/umn/en-us_image_0000002271064250.png deleted file mode 100644 index 50c9d4d79..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002271064250.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271181068.png b/docs/dataartsstudio/umn/en-us_image_0000002271181068.png deleted file mode 100644 index d921dea18..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002271181068.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271689457.png b/docs/dataartsstudio/umn/en-us_image_0000002271689457.png new file mode 100644 index 000000000..dc4d3de4c Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002271689457.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271691905.png b/docs/dataartsstudio/umn/en-us_image_0000002271691905.png new file mode 100644 index 000000000..5142e68a0 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002271691905.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271769549.png b/docs/dataartsstudio/umn/en-us_image_0000002271769549.png new file mode 100644 index 000000000..59ee0b888 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002271769549.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405125.png b/docs/dataartsstudio/umn/en-us_image_0000002305405125.png deleted file mode 100644 index 2e120b4d7..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305405125.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305405681.png b/docs/dataartsstudio/umn/en-us_image_0000002305405681.png deleted file mode 100644 index 4a648918d..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305405681.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406441.png b/docs/dataartsstudio/umn/en-us_image_0000002305406441.png deleted file mode 100644 index 6c099cfea..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406441.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406445.png b/docs/dataartsstudio/umn/en-us_image_0000002305406445.png deleted file mode 100644 index 8b1e94d9f..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406445.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406449.png b/docs/dataartsstudio/umn/en-us_image_0000002305406449.png deleted file mode 100644 index 7e4d40185..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406449.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406469.png b/docs/dataartsstudio/umn/en-us_image_0000002305406469.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406469.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406493.png b/docs/dataartsstudio/umn/en-us_image_0000002305406493.png deleted file mode 100644 index 0f0140f68..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406493.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406533.png b/docs/dataartsstudio/umn/en-us_image_0000002305406533.png deleted file mode 100644 index 16c54b83e..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406533.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406693.png b/docs/dataartsstudio/umn/en-us_image_0000002305406693.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406693.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406817.png b/docs/dataartsstudio/umn/en-us_image_0000002305406817.png deleted file mode 100644 index a05812536..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406817.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406901.png b/docs/dataartsstudio/umn/en-us_image_0000002305406901.png deleted file mode 100644 index 6a895a9e4..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406901.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305406993.png b/docs/dataartsstudio/umn/en-us_image_0000002305406993.png deleted file mode 100644 index 5272c02c4..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305406993.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407013.png b/docs/dataartsstudio/umn/en-us_image_0000002305407013.png deleted file mode 100644 index 252bc39fb..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407013.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407201.png b/docs/dataartsstudio/umn/en-us_image_0000002305407201.png deleted file mode 100644 index 2be05c86b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407201.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407205.png b/docs/dataartsstudio/umn/en-us_image_0000002305407205.png deleted file mode 100644 index 2be05c86b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407205.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407345.png b/docs/dataartsstudio/umn/en-us_image_0000002305407345.png deleted file mode 100644 index 51bc3cf43..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407345.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407361.png b/docs/dataartsstudio/umn/en-us_image_0000002305407361.png deleted file mode 100644 index 5e9d57f6b..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407361.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407397.png b/docs/dataartsstudio/umn/en-us_image_0000002305407397.png deleted file mode 100644 index f10b490d1..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407397.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407545.png b/docs/dataartsstudio/umn/en-us_image_0000002305407545.png deleted file mode 100644 index 0348ca8e6..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407545.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407821.png b/docs/dataartsstudio/umn/en-us_image_0000002305407821.png deleted file mode 100644 index 98d5a110c..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407821.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407917.png b/docs/dataartsstudio/umn/en-us_image_0000002305407917.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407917.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305407921.png b/docs/dataartsstudio/umn/en-us_image_0000002305407921.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305407921.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408141.png b/docs/dataartsstudio/umn/en-us_image_0000002305408141.png deleted file mode 100644 index 0eaed8783..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305408141.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408269.png b/docs/dataartsstudio/umn/en-us_image_0000002305408269.png deleted file mode 100644 index 37c23e95f..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305408269.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408373.png b/docs/dataartsstudio/umn/en-us_image_0000002305408373.png deleted file mode 100644 index f8555ff19..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305408373.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408377.png b/docs/dataartsstudio/umn/en-us_image_0000002305408377.png deleted file mode 100644 index 0fde13ff3..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305408377.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305408409.png b/docs/dataartsstudio/umn/en-us_image_0000002305408409.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305408409.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305438189.png b/docs/dataartsstudio/umn/en-us_image_0000002305438189.png deleted file mode 100644 index f43e0743e..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305438189.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439409.png b/docs/dataartsstudio/umn/en-us_image_0000002305439409.png deleted file mode 100644 index 47c58d4cb..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439409.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439505.png b/docs/dataartsstudio/umn/en-us_image_0000002305439505.png deleted file mode 100644 index 5adefb505..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439505.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439541.png b/docs/dataartsstudio/umn/en-us_image_0000002305439541.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439541.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439557.png b/docs/dataartsstudio/umn/en-us_image_0000002305439557.png deleted file mode 100644 index 359393e3e..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439557.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439645.png b/docs/dataartsstudio/umn/en-us_image_0000002305439645.png deleted file mode 100644 index 07ded6e03..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439645.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439681.png b/docs/dataartsstudio/umn/en-us_image_0000002305439681.png deleted file mode 100644 index a926d8608..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439681.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439865.png b/docs/dataartsstudio/umn/en-us_image_0000002305439865.png deleted file mode 100644 index 36b728818..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439865.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305439969.png b/docs/dataartsstudio/umn/en-us_image_0000002305439969.png deleted file mode 100644 index b31c90053..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305439969.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440273.png b/docs/dataartsstudio/umn/en-us_image_0000002305440273.png deleted file mode 100644 index 7391d1296..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305440273.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440405.png b/docs/dataartsstudio/umn/en-us_image_0000002305440405.png deleted file mode 100644 index 40de7ba3a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305440405.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440477.png b/docs/dataartsstudio/umn/en-us_image_0000002305440477.png deleted file mode 100644 index a5209fd63..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305440477.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305440837.png b/docs/dataartsstudio/umn/en-us_image_0000002305440837.png deleted file mode 100644 index 0d732e7c3..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305440837.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441177.png b/docs/dataartsstudio/umn/en-us_image_0000002305441177.png deleted file mode 100644 index b74e9290a..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305441177.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441209.png b/docs/dataartsstudio/umn/en-us_image_0000002305441209.png deleted file mode 100644 index 9eb5c5275..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305441209.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441221.png b/docs/dataartsstudio/umn/en-us_image_0000002305441221.png deleted file mode 100644 index 7bb697d1e..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305441221.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441289.png b/docs/dataartsstudio/umn/en-us_image_0000002305441289.png deleted file mode 100644 index a620b99af..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305441289.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305441437.png b/docs/dataartsstudio/umn/en-us_image_0000002305441437.png deleted file mode 100644 index 2188bed58..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305441437.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305717785.png b/docs/dataartsstudio/umn/en-us_image_0000002305717785.png deleted file mode 100644 index ef7245f43..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305717785.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002305833085.png b/docs/dataartsstudio/umn/en-us_image_0000002305833085.png deleted file mode 100644 index efb8e4433..000000000 Binary files a/docs/dataartsstudio/umn/en-us_image_0000002305833085.png and /dev/null differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002390854012.png b/docs/dataartsstudio/umn/en-us_image_0000002390854012.png new file mode 100644 index 000000000..f47c2335d Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002390854012.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002391028724.png b/docs/dataartsstudio/umn/en-us_image_0000002391028724.png new file mode 100644 index 000000000..f47c2335d Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002391028724.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424389693.png b/docs/dataartsstudio/umn/en-us_image_0000002424389693.png new file mode 100644 index 000000000..2e5e701bc Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424389693.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424390041.png b/docs/dataartsstudio/umn/en-us_image_0000002424390041.png new file mode 100644 index 000000000..b575292e6 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424390041.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271461758.png b/docs/dataartsstudio/umn/en-us_image_0000002424391613.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002271461758.png rename to docs/dataartsstudio/umn/en-us_image_0000002424391613.png diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424391793.png b/docs/dataartsstudio/umn/en-us_image_0000002424391793.png new file mode 100644 index 000000000..51bc0e4e7 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424391793.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424392261.png b/docs/dataartsstudio/umn/en-us_image_0000002424392261.png new file mode 100644 index 000000000..74bb072dc Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424392261.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424508617.png b/docs/dataartsstudio/umn/en-us_image_0000002424508617.png new file mode 100644 index 000000000..f47c2335d Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424508617.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424509573.png b/docs/dataartsstudio/umn/en-us_image_0000002424509573.png new file mode 100644 index 000000000..71e5fcfa9 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424509573.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002424510233.png b/docs/dataartsstudio/umn/en-us_image_0000002424510233.png new file mode 100644 index 000000000..b575292e6 Binary files /dev/null and b/docs/dataartsstudio/umn/en-us_image_0000002424510233.png differ diff --git a/docs/dataartsstudio/umn/en-us_image_0000002271193404.png b/docs/dataartsstudio/umn/en-us_image_0000002424511029.png similarity index 100% rename from docs/dataartsstudio/umn/en-us_image_0000002271193404.png rename to docs/dataartsstudio/umn/en-us_image_0000002424511029.png diff --git a/docs/dataartsstudio/umn/en-us_topic_0000002270788944.html b/docs/dataartsstudio/umn/en-us_topic_0000002270788944.html deleted file mode 100644 index 82a9cad84..000000000 --- a/docs/dataartsstudio/umn/en-us_topic_0000002270788944.html +++ /dev/null @@ -1,42 +0,0 @@ - - -

                                                                            Tags

                                                                            -

                                                                            A tag is a key-value pair that identifies an instance. It consists of a key and a value.

                                                                            -

                                                                            DataArts Studio instance tags can be used in the following scenarios:

                                                                            -
                                                                            • If there are a large number of cloud resources, you can add tags to them (including DataArts Studio instances) by user, maintainer, or usage. Then you can use Tag Management Service (TMS) to identify tags and manage cloud resources easily.
                                                                            • If there are multiple DataArts Studio instances, you can add tags to them by user, maintainer, or usage. Then you can search for and identify DataArts Studio instances by tag on the DataArts Studio instance list page.
                                                                            -

                                                                            Constraints

                                                                            • A DataArts Studio instance can have a maximum of 20 tags.
                                                                            • Each tag key must be unique. Only one tag value can be added to a tag key.
                                                                            -
                                                                            -

                                                                            Procedure

                                                                            1. Log in to the DataArts Studio console by following the instructions in Accessing the DataArts Studio Instance Console.
                                                                            2. On the Tags page, click Add/Edit Tag. In the displayed dialog box, set parameters. Enter a tag key and a value, and click Add.

                                                                              Figure 1 Adding/Editing tags
                                                                              - -
                                                                              - - - - - - - - - - -
                                                                              Table 1 Tag parameters

                                                                              Parameter

                                                                              -

                                                                              Description

                                                                              -

                                                                              Tag Key

                                                                              -
                                                                              DataArts Studio supports predefined tags and resource tags.
                                                                              • Predefined tags are created on TMS. They may suit your needs to manage multiple services by tag.

                                                                                To use a predefined tag, you must create one on TMS first. Then you can select it from the Tag key drop-down list. You can click View predefined tags to enter the Predefined Tag page of TMS. Then, click Create Tag to create a predefined tag. For details, see Creating Predefined Tags in Tag Management Service User Guide.

                                                                                -
                                                                              • Resource tags are created when you add a tag. You do not need to define them in advance. Resource tags are suitable for you to manage DataArts Studio instances by tag.

                                                                                To use a resource tag, you can enter the tag key in the box. The tag key can contain a maximum of 128 characters, including uppercase letters, lowercase letters, digits, spaces, and the following special characters: _.:=+-@. The tag key cannot start with a space or _sys_, or end with a space.

                                                                                -
                                                                              -
                                                                              -

                                                                              Tag Value

                                                                              -

                                                                              You can specify the tag value in either of the following ways:

                                                                              -
                                                                              • Predefined tags: Click the text box and select a predefined tag value from the drop-down list.
                                                                              • Resource tags: Enter a tag value in the text box. The tag value can contain a maximum of 255 characters, including uppercase letters, lowercase letters, digits, spaces, and the following special characters: _.:=+-@. The tag value cannot start or end with a space.
                                                                              -
                                                                              -
                                                                              -

                                                                            -
                                                                            -
                                                                            -
                                                                            - -
                                                                            - diff --git a/docs/dataartsstudio/umn/en-us_topic_0000002270846046.html b/docs/dataartsstudio/umn/en-us_topic_0000002270846046.html deleted file mode 100644 index d57bf75c5..000000000 --- a/docs/dataartsstudio/umn/en-us_topic_0000002270846046.html +++ /dev/null @@ -1,18 +0,0 @@ - - -

                                                                            Management Console

                                                                            -

                                                                            -
                                                                            -
                                                                            - - - -
                                                                            - diff --git a/docs/dataartsstudio/umn/public_sys-resources/imageclose.gif b/docs/dataartsstudio/umn/public_sys-resources/imageclose.gif new file mode 100644 index 000000000..3a3344af4 Binary files /dev/null and b/docs/dataartsstudio/umn/public_sys-resources/imageclose.gif differ diff --git a/docs/dataartsstudio/umn/public_sys-resources/imageclosehover.gif b/docs/dataartsstudio/umn/public_sys-resources/imageclosehover.gif new file mode 100644 index 000000000..8699d5e36 Binary files /dev/null and b/docs/dataartsstudio/umn/public_sys-resources/imageclosehover.gif differ diff --git a/docs/dataartsstudio/umn/public_sys-resources/imagemax.gif b/docs/dataartsstudio/umn/public_sys-resources/imagemax.gif new file mode 100644 index 000000000..99c07dc25 Binary files /dev/null and b/docs/dataartsstudio/umn/public_sys-resources/imagemax.gif differ diff --git a/docs/dataartsstudio/umn/public_sys-resources/imagemaxhover.gif b/docs/dataartsstudio/umn/public_sys-resources/imagemaxhover.gif new file mode 100644 index 000000000..d01d77d6e Binary files /dev/null and b/docs/dataartsstudio/umn/public_sys-resources/imagemaxhover.gif differ diff --git a/docs/dataartsstudio/umn/public_sys-resources/macFFBgHack.png b/docs/dataartsstudio/umn/public_sys-resources/macFFBgHack.png new file mode 100644 index 000000000..ec811470c Binary files /dev/null and b/docs/dataartsstudio/umn/public_sys-resources/macFFBgHack.png differ