Skip to content

Commit 27e3541

Browse files
committed
EOD backup
1 parent f3d541a commit 27e3541

File tree

2 files changed

+42
-15
lines changed

2 files changed

+42
-15
lines changed

purview/lineage/palsa/README.md

Lines changed: 11 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -11,9 +11,15 @@ chmod +x openlineage-deployment.sh
1111
cd -
1212
```
1313

14-
Connect with existing
15-
```
16-
17-
./standalone.sh
14+
## Deploy option 2: Connect with existing
15+
1. Run `./standalone.sh deploy`
16+
2. Add the service principal `Purview-ADB-Lineage-Solution-Accelerator` to the `Data Curator` role in your Purview resource.
17+
- `Data Map` > `Domains` > select the Purview instance > `Role assignments`
18+
3. Install necessary types into your Purview instance
19+
```
20+
./standalone.sh config-purview
21+
# TODO: troubleshoot the ATLAS-400-00-01A "invalid payload" error returned by this step
22+
```
1823
19-
```
24+
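4. TODO: download the OpenLineage Spark agent and configure it with your Azure Databricks clusters (see the link below)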
25+
https://github.com/microsoft/Purview-ADB-Lineage-Solution-Accelerator/blob/release/2.3/deploy-base.md#download-the-openlineage-spark-agent-and-configure-with-your-azure-databricks-clusters
Lines changed: 31 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
11
set -e
2+
23
if ! [ -f ./common.sh ]; then
34
curl https://raw.githubusercontent.com/davidkhala/Microsoft/refs/heads/main/purview/lineage/palsa/common.sh -O
45
source ./common.sh
@@ -7,6 +8,34 @@ else
78
source ./common.sh
89
fi
910

11+
# Capture the output of the remote purview.sh helper, run via bash with the
# single argument `name`, into purviewName (presumably the name of the Purview
# account in the current Azure context — confirm against purview.sh).
# NOTE(review): this downloads and executes a script from an unpinned branch
# (refs/heads/main); consider pinning to a commit hash.
purviewName=$(curl https://raw.githubusercontent.com/davidkhala/azure-utils/refs/heads/main/cli/purview.sh | bash -s name)
12+
13+
# Deploy the accelerator's Azure resources into a resource group.
#
# Downloads the ARM template newdeploymenttemp.json from the release/2.3 branch
# of microsoft/Purview-ADB-Lineage-Solution-Accelerator into the current
# directory, runs `az deployment group create` with it, and then removes the
# downloaded template whether or not the deployment succeeded.
#
# Globals read: rg, purviewName, clientid, clientsecret
# Returns: the exit status of `az deployment group create`, or curl's status
#   if the template could not be downloaded.
deploy() {
  local status=0

  # -f: fail on an HTTP error instead of saving the error page as the template.
  curl -f https://raw.githubusercontent.com/microsoft/Purview-ADB-Lineage-Solution-Accelerator/refs/heads/release/2.3/deployment/infra/newdeploymenttemp.json -O || return

  # Every expansion is quoted so values containing spaces or glob characters
  # reach `az` as single arguments. The status is captured (rather than letting
  # `set -e` abort here) so the template is always cleaned up below.
  az deployment group create \
    --resource-group "$rg" \
    --template-file "./newdeploymenttemp.json" \
    --parameters \
      "purviewName=$purviewName" \
      prefixName= \
      "clientid=$clientid" \
      "clientsecret=$clientsecret" \
      'resourceTagValues={}' \
    --output none || status=$?
  # if failure, clean up by `az deployment group delete --name newdeploymenttemp --resource-group $rg`
  rm -f newdeploymenttemp.json
  return "$status"
}
20+
21+
# Install necessary types into your Purview instance.
#
# Steps:
#   1. Obtain the tenant id from the remote context.sh helper (run with the
#      argument `tenant`).
#   2. Request an OAuth2 client-credentials token for https://purview.azure.net
#      using clientid / clientsecret.
#   3. Download Custom_Types.json from the release/2.3 branch of
#      microsoft/Purview-ADB-Lineage-Solution-Accelerator.
#   4. POST it to the Atlas typedefs endpoint of the Purview account and remove
#      the downloaded file.
#
# Globals read: purviewName, clientid, clientsecret
# Outputs: the typedefs API response body on stdout.
# Returns: non-zero if no access token was obtained or the type definitions
#   could not be downloaded; otherwise the status of the final cleanup.
config-purview() {
  local purview_endpoint="https://$purviewName.purview.azure.com"
  # Declared separately from the assignments so a failing command substitution
  # is not masked by `local`'s own exit status.
  local tenantid login_endpoint acc_purview_token

  tenantid=$(curl https://raw.githubusercontent.com/davidkhala/azure-utils/refs/heads/main/cli/context.sh | bash -s tenant)

  login_endpoint="https://login.microsoftonline.com/$tenantid/oauth2/token"
  # --data-urlencode keeps a secret containing `&`, `+`, `=` or spaces intact;
  # `// empty` turns a missing token into an empty string instead of "null".
  acc_purview_token=$(curl "$login_endpoint" \
    --data-urlencode "resource=https://purview.azure.net" \
    --data-urlencode "client_id=$clientid" \
    --data-urlencode "client_secret=$clientsecret" \
    --data-urlencode "grant_type=client_credentials" \
    -H Metadata:true -s | jq -r '.access_token // empty')

  if [ -z "$acc_purview_token" ]; then
    echo "config-purview: failed to obtain an access token from $login_endpoint" >&2
    return 1
  fi

  # -f: fail on an HTTP error instead of saving (and later POSTing) an error page.
  curl -f https://raw.githubusercontent.com/microsoft/Purview-ADB-Lineage-Solution-Accelerator/refs/heads/release/2.3/deployment/infra/Custom_Types.json -O || return

  curl -s -X POST "$purview_endpoint/catalog/api/atlas/v2/types/typedefs" -H "Authorization: Bearer $acc_purview_token" -H "Content-Type: application/json" -d @Custom_Types.json
  # TODO troubleshoot error
  # {"requestId":"d1fb3a39-9016-44c0-9a7a-8164419d4188","errorCode":"ATLAS-400-00-01A","errorMessage":"invalid parameters: invalid payload, expect schemaAttributes in purview_custom_connector_generic_column should be list of string, but found: data_type"}
  rm -f Custom_Types.json
}
37+
38+
# TODO databricks part
1039
if ! unzip -v; then
1140
echo "unzip is required. Please find and install on your OS"
1241
exit 1
@@ -16,13 +45,5 @@ if ! databricks -v; then
1645
# install DataBricks CLI
1746
curl -fsSL https://raw.githubusercontent.com/databricks/setup-cli/main/install.sh | sudo sh
1847
fi
19-
20-
rg=${rg:-"Purview-ADB-Lineage-Solution-Accelerator"}
21-
purviewName=$(curl https://raw.githubusercontent.com/davidkhala/azure-utils/refs/heads/main/cli/purview.sh | bash -s name)
22-
23-
# DEBUG
24-
curl https://raw.githubusercontent.com/microsoft/Purview-ADB-Lineage-Solution-Accelerator/refs/heads/release/2.3/deployment/infra/newdeploymenttemp.json -O
25-
26-
az deployment group create --resource-group $rg --template-file "./newdeploymenttemp.json" --parameters purviewName=$purviewName prefixName= clientid=$clientid clientsecret=$clientsecret resourceTagValues={} --output none
27-
# if failure, clean up by `az deployment group delete --name newdeploymenttemp --resource-group $rg`
28-
rm newdeploymenttemp.json
48+
# TODO databricks part
49+
# Run the command named by the first script argument, forwarding the remaining
# arguments to it. Quoted so arguments containing spaces or glob characters are
# passed through unchanged instead of being re-split.
"$@"

0 commit comments

Comments
 (0)