Dave Ruijter DaveRuijter

## pipeline-backup-weekly.yml
parameters:
  - name: backupStore
    displayName: 'Backup 05 store'
    type: boolean
    default: true
  - name: backupBronze
    displayName: 'Backup 10 bronze'
    type: boolean
    default: true
  - name: backupSilver

## pipeline-backup-daily.yml
parameters:
  - name: backupStore
    displayName: 'Backup 05 store'
    type: boolean
    default: true
  - name: backupBronze
    displayName: 'Backup 10 bronze'
    type: boolean
    default: true
  - name: backupSilver

## job-backup-dls.yml
parameters:
  - name: backups
    displayName: 'Array of backups'
    type: object
    default: []
  - name: serviceConnectionName
    displayName: 'Name of the DevOps Service Connection'
    type: string
  - name: execute
    displayName: 'Execute this Job'

## is_pipeline_running.json
{
	"name": "00_is_pipeline_running",
	"properties": {
		"activities": [
			{
				"name": "Get Pipeline Runs",
				"type": "WebActivity",
				"dependsOn": [
					{
						"activity": "getSubscriptionID",

## multicolumn_expression_evaluation.py
from great_expectations.expectations.expectation import MulticolumnMapExpectation
from great_expectations.expectations.util import render_evaluation_parameter_string
from great_expectations.render.util import (
    num_to_str,
    substitute_none_for_missing,
    parse_row_condition_string_pandas_engine,
)
from scipy import stats as stats
from great_expectations.execution_engine import (
    PandasExecutionEngine,

## generate_hash.py

spark.udf.register("udf_removehtmltagsfromstring", udf_removehtmltagsfromstring, "string")

# This is the central hashing function, used by other functions. It uses the blake2b hashing algorithm. With a central function, we can adjust the hashing when needed.
def udf_centralhash(string: str) -> int:
    val = hashlib.blake2b(
        digest_size=6
    )  # Increase digest size to make the hashing bigger. 6 seems a good start for our use for dimensions.
    val.update(string.encode("utf-8"))  # give the input string as utf-8 to the blake2b object
    intval = int(val.hexdigest(), 16)  # and convert it to an integer

## AddServicePrincipalToPowerBIWorkspaces.ps1
# =================================================================================================================================================
## This script will add the given Service Principal to Power BI workspaces
## It will first ask for the (correct) ObjectId of the Service Principal
## Then it will ask for the credentials of a Power BI Service Administrator

## Note: this script only works with v2 workspaces (you can't add a Service Principal to a v1 workspace)
# =================================================================================================================================================

## Parameters

## pipeline-release-administration.yml
trigger:
  - main
  - master

pool:
  vmImage: ubuntu-latest

## Job to create release and add tag
jobs:
  - job: CalculateVersion

## gitversion.yml
next-version: 1.0
assembly-versioning-scheme: MajorMinorPatch
assembly-file-versioning-scheme: MajorMinorPatchTag
assembly-informational-format: '{InformationalVersion}'
mode: ContinuousDelivery
increment: Inherit
continuous-delivery-fallback-tag: ci
tag-prefix: '[vV]'
major-version-bump-message: '\+semver:\s?(breaking|major)'
minor-version-bump-message: '\+semver:\s?(feature|minor)'

## pl_PBI_dataset_refresh.json
{
    "name": "pipeline1",
    "properties": {
        "activities": [
            {
                "name": "Call dataset refresh",
                "type": "WebActivity",
                "dependsOn": [
                    {
                        "activity": "Get AAD Token",
	parameters:
	- name: backupStore
	displayName: 'Backup 05 store'
	type: boolean
	default: true
	- name: backupBronze
	displayName: 'Backup 10 bronze'
	type: boolean
	default: true
	- name: backupSilver
	parameters:
	- name: backups
	displayName: 'Array of backups'
	type: object
	default: []
	- name: serviceConnectionName
	displayName: 'Name of the DevOps Service Connection'
	type: string
	- name: execute
	displayName: 'Execute this Job'
	{
	"name": "00_is_pipeline_running",
	"properties": {
	"activities": [
	{
	"name": "Get Pipeline Runs",
	"type": "WebActivity",
	"dependsOn": [
	{
	"activity": "getSubscriptionID",
	from great_expectations.expectations.expectation import MulticolumnMapExpectation
	from great_expectations.expectations.util import render_evaluation_parameter_string
	from great_expectations.render.util import (
	num_to_str,
	substitute_none_for_missing,
	parse_row_condition_string_pandas_engine,
	)
	from scipy import stats as stats
	from great_expectations.execution_engine import (
	PandasExecutionEngine,

	spark.udf.register("udf_removehtmltagsfromstring", udf_removehtmltagsfromstring, "string")

	# This is the central hashing function, used by other functions. It uses the blake2b hashing algorithm. With a central function, we can adjust the hashing when needed.
	def udf_centralhash(string: str) -> int:
	val = hashlib.blake2b(
	digest_size=6
	) # Increase digest size to make the hashing bigger. 6 seems a good start for our use for dimensions.
	val.update(string.encode("utf-8")) # give the input string as utf-8 to the blake2b object
	intval = int(val.hexdigest(), 16) # and convert it to an integer
	# =================================================================================================================================================
	## This script will add the given Service Principal to Power BI workspaces
	## It will first ask for the (correct) ObjectId of the Service Principal
	## Then it will ask for the credentials of a Power BI Service Administrator

	## Note: this script only works with v2 workspaces (you can't add a Service Principal to a v1 workspace)
	# =================================================================================================================================================

	## Parameters
	trigger:
	- main
	- master

	pool:
	vmImage: ubuntu-latest

	## Job to create release and add tag
	jobs:
	- job: CalculateVersion
	next-version: 1.0
	assembly-versioning-scheme: MajorMinorPatch
	assembly-file-versioning-scheme: MajorMinorPatchTag
	assembly-informational-format: '{InformationalVersion}'
	mode: ContinuousDelivery
	increment: Inherit
	continuous-delivery-fallback-tag: ci
	tag-prefix: '[vV]'
	major-version-bump-message: '\+semver:\s?(breaking|major)'
	minor-version-bump-message: '\+semver:\s?(feature|minor)'
	{
	"name": "pipeline1",
	"properties": {
	"activities": [
	{
	"name": "Call dataset refresh",
	"type": "WebActivity",
	"dependsOn": [
	{
	"activity": "Get AAD Token",