Tutorial: How to Deploy a Linux VM in Microsoft Azure Cloud

Tutorial: How to Deploy a Linux VM in Microsoft Azure Cloud

6 January 2023

Guilherme Melo

In this article, we will learn how to deploy a Linux VM instance in Microsoft Azure Cloud using Terraform. We will create a step-by-step deployment of a Linux virtual machine with extra disks using Terraform to guide and optimize the deployment process.

Requirements

  • Credentials of a Service Principal who will execute Terraform code;
  • Create a Resource Group
  • Create a Virtual Network and Subnet
  • Create a Shared Image or Image

Tree Structure

Creating a Terraform file for Azure authentication

First, we will create a file called provider.tf to be used by Azure authentication.

We will need a Subscription ID, Tenant ID, Service Principal ID, and the Secret of the Service Principal.

Add the following code to the file and fill in the inputs:

 

terraform {
 required_providers {
   azurerm = {
     source = "hashicorp/azurerm"
     version = "3.30.0"
   }
 }
}
 
provider "azurerm" {
 subscription_id   = "<azure_subscription_id>"
 tenant_id         = "<azure_subscription_tenant_id>"
 client_id         = "<service_principal_appid>"
 client_secret     = "<service_principal_password>"
}

The version in the required_providers azurerm section is useful to pin a specific version, but is not required.

Creating a Terraform file for Linux VM

Now, create the compute.tf file to build the Azure VM Instance. We will split the code for better clarity. Initially, we will fetch Data of the previously created Resource Group and Subnet.

 

data "azurerm_resource_group" "rg" {
 name = var.rg_name
}
 
data "azurerm_subnet" "sub" {
 name                 = var.subnet_name
 virtual_network_name = var.vnet_name
 resource_group_name  = var.rg_name
}

This section of code will create a Network Interface and assign a Public IP (if necessary).

 

resource "azurerm_public_ip" "pip" {
 count = var.private_ip_address == null ? 1 : 0
 
 name                = "pip-${var.vm_name}"
 resource_group_name = data.azurerm_resource_group.rg.name
 location            = var.location
 allocation_method   = var.public_ip_allocation
 sku                 = "Standard"
 
 tags = var.tags
}
 
resource "azurerm_network_interface" "nic" {
 name                = "nic-${var.vm_name}"
 location            = var.location
 resource_group_name = data.azurerm_resource_group.rg.name
 
 ip_configuration {
   name                          = "internal"
   private_ip_address_allocation = var.private_ip_address == null ? "Dynamic" : "Static"
   private_ip_address_version    = "IPv4"
   subnet_id                     = data.azurerm_subnet.sub.id
   private_ip_address            = var.private_ip_address
   public_ip_address_id          = var.private_ip_address == null ? join("", azurerm_public_ip.pip.*.id) : null
 }
 tags = var.tags
}

This section of code will create the VM Instance.

 

resource "azurerm_linux_virtual_machine" "vm" {
 name                     = var.vm_name
 location                 = var.location
 resource_group_name      = data.azurerm_resource_group.rg.name
 size                     = var.vm_size
 admin_username           = var.username
 admin_password           = var.password
 network_interface_ids    = [azurerm_network_interface.nic.id]
  os_disk {
   caching                = "ReadWrite"
   storage_account_type   = var.bootdisk_type
   disk_size_gb           = var.bootdisk_size
 }
 
 source_image_reference {
     publisher = var.image.os_publisher
     offer     = var.image.os_offer
     sku       = var.image.os_sku
     version   = var.image.os_version
 }
 
 boot_diagnostics {
   #When empty utilize a Platform-Managed Storage Account.
 }
 
 identity {
   type = "SystemAssigned"
 }
 
 tags = var.tags
 
 depends_on = [azurerm_network_interface.nic]
}

Finally, this section of code will create Managed Disks and attach to the VM.

 

resource "azurerm_managed_disk" "disk" {
 for_each = var.managed_disk
 
 name                   = "${var.vm_name}-${each.value.name}"
 location               = var.location
 resource_group_name    = data.azurerm_resource_group.rg.name
 storage_account_type   = each.value.disk_type
 create_option          = "Empty"
 disk_size_gb           = each.value.disk_size
 
 depends_on = [azurerm_windows_virtual_machine.vm]
}
 
resource "azurerm_virtual_machine_data_disk_attachment" "atch" {
 for_each = azurerm_managed_disk.disk
 
 managed_disk_id    = each.value.id
 virtual_machine_id = azurerm_windows_virtual_machine.vm.id
 lun                = index(keys(azurerm_managed_disk.disk), each.key)
 caching            = "ReadWrite"
 
 depends_on = [azurerm_managed_disk.disk]
}

Creating a Terraform file for variables

In this step, we will create the file variables.tf to configure the variables.

Add the following code to the file:

 

##Data Variables##
variable "rg_name" {
 type = string
}
 
variable "vnet_name" {
 type = string
}
 
variable "subnet_name" {
 type = string
}
 
##NIC Variables##
variable "public_ip_allocation" {
 type = string
}
 
variable "private_ip_address" {
 type = string
}
 
##Compute Variables##
variable "location" {
 type = string
}
 
variable "vm_name" {
 type = string
}
 
variable "vm_size" {
 type = string
}
 
variable "username" {
 type = string
}
 
variable "password" {
 type = string
}
 
variable "bootdisk_size" {
 type = string
}
 
variable "bootdisk_type" {
 type = string
}
 
variable "image" {
 type = object({
   os_publisher = string
   os_offer     = string
   os_sku       = string
   os_version   = string
 })
 default = {
   os_offer     = null
   os_publisher = null
   os_sku       = null
   os_version   = null
 }
}
 
##Disks Variables##
variable "managed_disk" {
 default = {}
 
 type = map(object({
   name      = string
   disk_type = string
   disk_size = number
 }))
}
 
variable "tags" {
 type = map(string)
}

Input definition variables

We can define the variables that we created before by creating a .tfvars file, a module, or by using Terraform Cloud.

How to find Ubuntu VM image references for Terraform

There are two options to find Ubunty VM image references:

You can open the AZ CLI tool or the Cloud Shell in the Azure Console and enter the following command:

az vm image list –offer Ubuntu

Alternatively, you can access the Azure VM Image List.

Optional: bootstrapping the VM instance with Bash

We can also use a Bash script to bootstrap the VM instance. This extra step is useful to avoid having to manually mount the disks.

resource "azurerm_virtual_machine_extension" "disk_formatter" {
 count = azurerm_managed_disk.disk != {} ? 1 : 0
 
 name                 = "CustomScript"
 virtual_machine_id   = azurerm_linux_virtual_machine.vm.id
 publisher            = "Microsoft.Azure.Extensions"
 type                 = "CustomScript"
 type_handler_version = "2.1.1"
 protected_settings   = <<-PROTECTED_SETTINGS
 {
   "script": "#!/bin/bash

help()
{
    echo "Usage: $(basename $0) [-b data_base] [-h] [-s] [-o mount_options]"
    echo ""
    echo "Options:"
    echo "   -b         base directory for mount points (default: /datadisks)"
    echo "   -h         this help message"
    echo "   -s         create a striped RAID array (no redundancy)"
    echo "   -o         mount options for data disk"
}

log()
{

    echo "$1"
}

if [ "${UID}" -ne 0 ];
then
    log "Script executed without root permissions"
    echo "You must be root to run this program." >&2
    exit 3
fi

# Base path for data disk mount points
DATA_BASE="/datadisks"
# Mount options for data disk
MOUNT_OPTIONS="noatime,nodiratime,nodev,noexec,nosuid,nofail"
# Determines wheter partition and format data disks as raid set or not
RAID_CONFIGURATION=0

while getopts b:sho: optname; do
    log "Option $optname set with value ${OPTARG}"
  case ${optname} in
    b)  #set clsuter name
      DATA_BASE=${OPTARG}
      ;;
    s) #Partition and format data disks as raid set
      RAID_CONFIGURATION=1
      ;;
    o) #mount option
      MOUNT_OPTIONS=${OPTARG}
      ;;
    h)  #show help
      help
      exit 2
      ;;
    \?) #unrecognized option - show help
      echo -e \\n"Option -${BOLD}$OPTARG${NORM} not allowed."
      help
      exit 2
      ;;
  esac
done

get_next_md_device() {
    shopt -s extglob
    LAST_DEVICE=$(ls -1 /dev/md+([0-9]) 2>/dev/null|sort -n|tail -n1)
    if [ -z "${LAST_DEVICE}" ]; then
        NEXT=/dev/md0
    else
        NUMBER=$((${LAST_DEVICE/\/dev\/md/}))
        NEXT=/dev/md${NUMBER}
    fi
    echo ${NEXT}
}

is_partitioned() {
    OUTPUT=$(partx -s ${1} 2>&1)
    egrep "partition table does not contains usable partitions|failed to read partition table" <<< "${OUTPUT}" >/dev/null 2>&1
    if [ ${?} -eq 0 ]; then
        return 1
    else
        return 0
    fi
}

has_filesystem() {
    DEVICE=${1}
    OUTPUT=$(file -L -s ${DEVICE})
    grep filesystem <<< "${OUTPUT}" > /dev/null 2>&1
    return ${?}
}

scan_for_new_disks() {
    # Looks for unpartitioned disks
    declare -a RET
    DEVS=($(ls -1 /dev/sd*|egrep -v "[0-9]$"))
    for DEV in "${DEVS[@]}";
    do
        # The disk will be considered a candidate for partitioning
        # and formatting if it does not have a sd?1 entry or
        # if it does have an sd?1 entry and does not contain a filesystem
        is_partitioned "${DEV}"
        if [ ${?} -eq 0 ];
        then
            has_filesystem "${DEV}1"
            if [ ${?} -ne 0 ];
            then
                RET+=" ${DEV}"
            fi
        else
            RET+=" ${DEV}"
        fi
    done
    echo "${RET}"
}

get_next_mountpoint() {
    DIRS=$(ls -1d ${DATA_BASE}/disk* 2>/dev/null| sort --version-sort)
    MAX=$(echo "${DIRS}"|tail -n 1 | tr -d "[a-zA-Z/]")
    if [ -z "${MAX}" ];
    then
        echo "${DATA_BASE}/disk1"
        return
    fi
    IDX=1
    while [ "${IDX}" -lt "${MAX}" ];
    do
        NEXT_DIR="${DATA_BASE}/disk${IDX}"
        if [ ! -d "${NEXT_DIR}" ];
        then
            echo "${NEXT_DIR}"
            return
        fi
        IDX=$(( ${IDX} + 1 ))
    done
    IDX=$(( ${MAX} + 1))
    echo "${DATA_BASE}/disk${IDX}"
}

add_to_fstab() {
    UUID=${1}
    MOUNTPOINT=${2}
    grep "${UUID}" /etc/fstab >/dev/null 2>&1
    if [ ${?} -eq 0 ];
    then
        echo "Not adding ${UUID} to fstab again (it's already there!)"
    else
        LINE="UUID=\"${UUID}\"\t${MOUNTPOINT}\text4\t${MOUNT_OPTIONS}\t1 2"
        echo -e "${LINE}" >> /etc/fstab
    fi
}

do_partition() {
# This function creates one (1) primary partition on the
# disk, using all available space
    _disk=${1}
    _type=${2}
    if [ -z "${_type}" ]; then
        # default to Linux partition type (ie, ext3/ext4/xfs)
        _type=83
    fi
    echo "n
p
1


t
${_type}
w"| fdisk "${_disk}"

#
# Use the bash-specific $PIPESTATUS to ensure we get the correct exit code
# from fdisk and not from echo
if [ ${PIPESTATUS[1]} -ne 0 ];
then
    echo "An error occurred partitioning ${_disk}" >&2
    echo "I cannot continue" >&2
    exit 2
fi
}
#end do_partition

scan_partition_format()
{
    log "Begin scanning and formatting data disks"

    DISKS=($(scan_for_new_disks))

	if [ "${#DISKS}" -eq 0 ];
	then
	    log "No unpartitioned disks without filesystems detected"
	    return
	fi
	echo "Disks are ${DISKS[@]}"
	for DISK in "${DISKS[@]}";
	do
	    echo "Working on ${DISK}"
	    is_partitioned ${DISK}
	    if [ ${?} -ne 0 ];
	    then
	        echo "${DISK} is not partitioned, partitioning"
	        do_partition ${DISK}
	    fi
	    PARTITION=$(fdisk -l ${DISK}|grep -A 1 Device|tail -n 1|awk '{print $1}')
	    has_filesystem ${PARTITION}
	    if [ ${?} -ne 0 ];
	    then
	        echo "Creating filesystem on ${PARTITION}."
	#        echo "Press Ctrl-C if you don't want to destroy all data on ${PARTITION}"
	#        sleep 10
	        mkfs -j -t ext4 ${PARTITION}
	    fi
	    MOUNTPOINT=$(get_next_mountpoint)
	    echo "Next mount point appears to be ${MOUNTPOINT}"
	    [ -d "${MOUNTPOINT}" ] || mkdir -p "${MOUNTPOINT}"
	    read UUID FS_TYPE < <(blkid -u filesystem ${PARTITION}|awk -F "[= ]" '{print $3" "$5}'|tr -d "\"")
	    add_to_fstab "${UUID}" "${MOUNTPOINT}"
	    echo "Mounting disk ${PARTITION} on ${MOUNTPOINT}"
	    mount "${MOUNTPOINT}"
	done
}

create_striped_volume()
{
    DISKS=(${@})

	if [ "${#DISKS[@]}" -eq 0 ];
	then
	    log "No unpartitioned disks without filesystems detected"
	    return
	fi

	echo "Disks are ${DISKS[@]}"

	declare -a PARTITIONS

	for DISK in "${DISKS[@]}";
	do
	    echo "Working on ${DISK}"
	    is_partitioned ${DISK}
	    if [ ${?} -ne 0 ];
	    then
	        echo "${DISK} is not partitioned, partitioning"
	        do_partition ${DISK} fd
	    fi

	    PARTITION=$(fdisk -l ${DISK}|grep -A 2 Device|tail -n 1|awk '{print $1}')
	    PARTITIONS+=("${PARTITION}")
	done

    MDDEVICE=$(get_next_md_device)
	udevadm control --stop-exec-queue
	mdadm --create ${MDDEVICE} --level 0 -c 64 --raid-devices ${#PARTITIONS[@]} ${PARTITIONS[*]}
	udevadm control --start-exec-queue

	MOUNTPOINT=$(get_next_mountpoint)
	echo "Next mount point appears to be ${MOUNTPOINT}"
	[ -d "${MOUNTPOINT}" ] || mkdir -p "${MOUNTPOINT}"

	#Make a file system on the new device
	STRIDE=128 #(512kB stripe size) / (4kB block size)
	PARTITIONSNUM=${#PARTITIONS[@]}
	STRIPEWIDTH=$((${STRIDE} * ${PARTITIONSNUM}))

	mkfs.ext4 -b 4096 -E stride=${STRIDE},stripe-width=${STRIPEWIDTH},nodiscard "${MDDEVICE}"

	read UUID FS_TYPE < <(blkid -u filesystem ${MDDEVICE}|awk -F "[= ]" '{print $3" "$5}'|tr -d "\"")

	add_to_fstab "${UUID}" "${MOUNTPOINT}"

	mount "${MOUNTPOINT}"
}

check_mdadm() {
    dpkg -s mdadm >/dev/null 2>&1
    if [ ${?} -ne 0 ]; then
        (apt-get -y update || (sleep 15; apt-get -y update)) > /dev/null
        DEBIAN_FRONTEND=noninteractive apt-get -y install mdadm --fix-missing
    fi
}

# Create Partitions
DISKS=$(scan_for_new_disks)

if [ "$RAID_CONFIGURATION" -eq 1 ]; then
    check_mdadm
    create_striped_volume "${DISKS[@]}"
else
    scan_partition_format
fi
"
 }
 PROTECTED_SETTINGS
 
 depends_on = [
   azurerm_virtual_machine_data_disk_attachment.atch
 ]
}
No Comments

Sorry, the comment form is closed at this time.