diff --git a/sysadmin/grid5000/cassandra/00-reserve_disks.sh b/sysadmin/grid5000/cassandra/00-reserve_disks.sh index 1dd7a4e..3c69fe8 100755 --- a/sysadmin/grid5000/cassandra/00-reserve_disks.sh +++ b/sysadmin/grid5000/cassandra/00-reserve_disks.sh @@ -1,18 +1,19 @@ #!/usr/bin/env bash set -eu SCRIPT_DIR="$(pwd $(dirname @0))" cd "${SCRIPT_DIR}" source "${SCRIPT_DIR}/environment.cfg" +# ${STORAGE_HOSTS} ${JOURNAL_CLIENT_HOSTS} ${MONITORING_HOSTS} NODE_FILTER="" -for node in ${CASSANDRA_HOSTS} ${STORAGE_HOSTS} ${JOURNAL_CLIENT_HOSTS} ${MONITORING_HOSTS}; do +for node in ${CASSANDRA_HOSTS}; do NODE_FILTER="${NODE_FILTER},'${node}.${G5K_SITE}'" done NODE_FILTER="$(echo ${NODE_FILTER} | sed 's/^,//')" NODE_COUNT="$(echo ${NODE_FILTER} | tr ',' ' ' | wc -w)" oarsub -t noop -l "{type='disk' and host in (${NODE_FILTER})}/host=${NODE_COUNT}/disk=${CASSANDRA_DISKS_COUNT},walltime=${DISK_RESERVATION_DURATION}" diff --git a/sysadmin/grid5000/cassandra/01-run-interactive.sh b/sysadmin/grid5000/cassandra/01-run-interactive.sh new file mode 100755 index 0000000..d337481 --- /dev/null +++ b/sysadmin/grid5000/cassandra/01-run-interactive.sh @@ -0,0 +1,7 @@ +#!/usr/bin/env bash + +set -eu + +SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)" +cd "${SCRIPT_DIR}" # the called script derives its own SCRIPT_DIR from the cwd +"${SCRIPT_DIR}/02-reserve_nodes_interactive.sh" diff --git a/sysadmin/grid5000/cassandra/01-run.sh b/sysadmin/grid5000/cassandra/01-run.sh index 12b2534..5fdf4a3 100755 --- a/sysadmin/grid5000/cassandra/01-run.sh +++ b/sysadmin/grid5000/cassandra/01-run.sh @@ -1,13 +1,26 @@ #!/usr/bin/env bash set -eu SCRIPT_DIR="$(pwd $(dirname @0))" +source "${SCRIPT_DIR}/environment.cfg" + ${SCRIPT_DIR}/02-reserve_nodes.sh echo "########### Waiting for node installations" while [ ! 
-e ${SCRIPT_DIR}/nodes.installed ]; do sleep 2 done -echo "########### Node installations detected" +echo "########### Node installations done" + +echo "########### Initialize cassandra" +FIRST_STORAGE_HOST="$(echo ${STORAGE_HOSTS} | cut -f1 -d' ')" +STORAGE_NODE="${FIRST_STORAGE_HOST}.${G5K_SITE}" + +ssh "${SSH_USER}@${STORAGE_NODE}" /usr/local/bin/swh-storage-init-cassandra.sh + +echo "####### FINISHED" + +echo "####### Sleeping" +sleep infinity diff --git a/sysadmin/grid5000/cassandra/02-reserve_nodes.sh b/sysadmin/grid5000/cassandra/02-reserve_nodes.sh index a0c1c13..c1463d5 100755 --- a/sysadmin/grid5000/cassandra/02-reserve_nodes.sh +++ b/sysadmin/grid5000/cassandra/02-reserve_nodes.sh @@ -1,19 +1,25 @@ #!/usr/bin/env bash set -eu SCRIPT_DIR="$(pwd $(dirname @0))" source "${SCRIPT_DIR}/environment.cfg" NODE_FILTER="" for node in ${CASSANDRA_HOSTS} ${STORAGE_HOSTS} ${JOURNAL_CLIENT_HOSTS} ${MONITORING_HOSTS}; do NODE_FILTER="${NODE_FILTER},'${node}.${G5K_SITE}'" done NODE_FILTER="$(echo ${NODE_FILTER} | sed 's/^,//')" NODE_COUNT="$(echo ${NODE_FILTER} | tr ',' ' ' | wc -w)" -oarsub -r '2021-06-08 19:05:00' -l "{host in (${NODE_FILTER})}/nodes=${NODE_COUNT},walltime=${NODE_RESERVATION_DURATION}" -t deploy ${SCRIPT_DIR}/03-deploy_nodes.sh -# -t besteffort -# -r '2021-06-08 19:05:00' +if [ -n "${OAR_JOB_ID:-}" ]; then # test the env var (the :- default keeps set -u happy), not a file named OAR_JOB_ID + echo "Running in reservation mode, nodes should be already reserved" + ${SCRIPT_DIR}/03-deploy_nodes.sh +else + echo "Reserving and installing nodes" + oarsub -l "{host in (${NODE_FILTER})}/nodes=${NODE_COUNT},walltime=${NODE_RESERVATION_DURATION}" -t deploy ${SCRIPT_DIR}/03-deploy_nodes.sh + # -t besteffort + # -r '2021-06-08 19:05:00' +fi diff --git a/sysadmin/grid5000/cassandra/00-reserve_disks.sh b/sysadmin/grid5000/cassandra/02-reserve_nodes_interactive.sh similarity index 69% copy from sysadmin/grid5000/cassandra/00-reserve_disks.sh copy to sysadmin/grid5000/cassandra/02-reserve_nodes_interactive.sh index 1dd7a4e..94d7e31 100755 --- 
a/sysadmin/grid5000/cassandra/00-reserve_disks.sh +++ b/sysadmin/grid5000/cassandra/02-reserve_nodes_interactive.sh @@ -1,18 +1,17 @@ #!/usr/bin/env bash set -eu SCRIPT_DIR="$(pwd $(dirname @0))" -cd "${SCRIPT_DIR}" source "${SCRIPT_DIR}/environment.cfg" NODE_FILTER="" for node in ${CASSANDRA_HOSTS} ${STORAGE_HOSTS} ${JOURNAL_CLIENT_HOSTS} ${MONITORING_HOSTS}; do NODE_FILTER="${NODE_FILTER},'${node}.${G5K_SITE}'" done NODE_FILTER="$(echo ${NODE_FILTER} | sed 's/^,//')" NODE_COUNT="$(echo ${NODE_FILTER} | tr ',' ' ' | wc -w)" -oarsub -t noop -l "{type='disk' and host in (${NODE_FILTER})}/host=${NODE_COUNT}/disk=${CASSANDRA_DISKS_COUNT},walltime=${DISK_RESERVATION_DURATION}" +oarsub -I -l "{host in (${NODE_FILTER})}/nodes=${NODE_COUNT},walltime=${NODE_RESERVATION_DURATION}" -t deploy diff --git a/sysadmin/grid5000/cassandra/03-deploy_nodes.sh b/sysadmin/grid5000/cassandra/03-deploy_nodes.sh index 8b7642f..66dabdb 100755 --- a/sysadmin/grid5000/cassandra/03-deploy_nodes.sh +++ b/sysadmin/grid5000/cassandra/03-deploy_nodes.sh @@ -1,35 +1,33 @@ #!/usr/bin/env bash -# set -eu +set -eu SCRIPT_DIR="$(pwd $(dirname @0))" source "${SCRIPT_DIR}/environment.cfg" -INSTALL_USER=root - echo "########### Nodes:" uniq "${OAR_FILE_NODES}" echo "########### Installing os on nodes" INSTALLED_OS_STAMP="${OAR_JOB_ID}.os.stamp" if [ ! -e "${SCRIPT_DIR}/${INSTALLED_OS_STAMP}" ]; then ${SCRIPT_DIR}/_install_os.sh touch "${SCRIPT_DIR}/${INSTALLED_OS_STAMP}" fi uniq "${OAR_NODE_FILE}" > ${SCRIPT_DIR}/nodes.lst echo "${CASSANDRA_HOSTS}" | sed 's/ /,/' > ${SCRIPT_DIR}/cassandra_seeds.lst -parallel rsync -avP . "${INSTALL_USER}"@{}:install < ${SCRIPT_DIR}/nodes.lst +parallel --halt now,fail=1 rsync -avP . 
"${SSH_USER}"@{}:install < ${SCRIPT_DIR}/nodes.lst -time parallel -u ssh "${INSTALL_USER}"@{} install/_provision_node.sh < ${SCRIPT_DIR}/nodes.lst +time parallel --halt now,fail=1 -u ssh ${SSH_OPTIONS} "${SSH_USER}"@{} install/_provision_node.sh < ${SCRIPT_DIR}/nodes.lst echo "########### Cassandra installation done" touch ${SCRIPT_DIR}/nodes.installed # The script must not exit to avoid the oar job to be killed echo "########### Sleeping" sleep infinity diff --git a/sysadmin/grid5000/cassandra/Readme.md b/sysadmin/grid5000/cassandra/Readme.md index 5d830d9..a13d76e 100644 --- a/sysadmin/grid5000/cassandra/Readme.md +++ b/sysadmin/grid5000/cassandra/Readme.md @@ -1,250 +1,257 @@ Grid5000 terraform provisioning =============================== - [Grid5000 terraform provisioning](#grid5000-terraform-provisioning) - [Prerequisite](#prerequisite) - [Run](#run) - [Local (on vagrant)](#local-on-vagrant) - [On Grid5000](#on-grid5000) - [Via the custom script](#via-the-custom-script) - [Reservation configuration](#reservation-configuration) - [Nodes configuration](#nodes-configuration) - [Execution](#execution) - [(deprecated) With terraform](#deprecated-with-terraform) - [Cleanup](#cleanup) - [TODO](#todo) - [Possible improvments](#possible-improvments) Prerequisite ------------ Tools ##### terraform >= 13.0 vagrant >= 2.2.3 [for local tests only] Credentials ########### * grid5000 credentials ``` cat < ~/.grid5000.yml uri: https://api.grid5000.fr username: username password: password EOF ``` Theses credentials will be used to interact with the grid5000 api to create the jobs * Private/public key files (id_rsa) in the `~/.ssh` directory The public key will be installed on the nodes Run --- ### Local (on vagrant) The `Vagrantfile` is configured to provision 3 nodes, install cassandra and the configure the cluster using the ansible configuration: ``` vagrant up vagrant ssh cassandra1 sudo -i nodetool status ``` If everything is ok, the `nodetool` command line returns: ``` 
root@cassandra1:~# nodetool status Datacenter: datacenter1 ======================= Status=Up/Down |/ State=Normal/Leaving/Joining/Moving -- Address Load Tokens Owns (effective) Host ID Rack UN 10.168.180.12 15.78 KiB 256 67.9% 05d61a24-832a-4936-b0a5-39926f800d09 rack1 UN 10.168.180.11 73.28 KiB 256 67.0% 23d855cc-37d6-43a7-886e-9446e7774f8d rack1 UN 10.168.180.13 15.78 KiB 256 65.0% c6bc1eff-fa0d-4b67-bc53-fc31c6ced5bb rack1 ``` Cassandra can take some time to start, so you have to wait before the cluster stabilize itself. ### On Grid5000 Useful link: Hardware information: https://www.grid5000.fr/w/Hardware Resources availability: https://www.grid5000.fr/w/Status #### Via the custom script ##### Reservation configuration The configuration is defined on the `environment.cfg` file. In this file, g5k sites, cluster, nodes and reparition can be configured. ##### Nodes configuration The node installation is done by ansible. It needs to know the node topology to correctly configure the tools (zfs pools and dataset, cassandra seed, ...) The configuration is centralized in the `ansible/hosts.yml` file ##### Execution 1. Transfer the files on g5k on the right site: ``` rsync -avP --exclude .vagrant --exclude .terraform cassandra access.grid5000.fr:/ ``` 2. Connect to the right site ``` ssh access.grid5000.fr ssh ``` 3. Reserve the disks The disks must be reserved before the node creation or they will not be detected on the nodes ``` ./00-reserve_disks.sh ``` check the status of the job / the resources status to be sure they are correctly reserved ``` $ oarstat -fj | grep state state = Running ``` The state must be running -4. Launch a complete run +4. 
Launch a complete run +For an interactive mode: ``` -./01-run.sh +./01-run-interactive.sh ``` DISCLAIMER: Actually, it only runs the following steps: - reserve the nodes - install the os on all the nodes - launch ansible on all the nodes The underlying scripts can by run indepedently if they need to be restarted: - `02-reserver-nodes.sh`: Reserve the node resources - `03-deploy-nodes.sh`: Install the os (only one time per reservation) and launch ansible on all the nodes. To force an os resinstalltion, remove the `.os.stamp` file -5. Cleanup the resources + +In a reservation: + +TODO the scripts need to be reorganized to automatize the scheduled resource reservation + +1. Cleanup the resources To release the nodes: ``` oarstat -u ``` ``` oardel ``` #### (deprecated) With terraform Terraform can be greate to reserve the resources but it doesn't not allow manage the scheduled jobs * Initialize terraform modules (first time only) ``` terraform init ``` * Test the plan It only check the status of the declared resources compared to the grid5000 status. It's a read only operation, no actions on grid5000 will be perform. ``` terraform plan ``` * Execute the plan ``` terraform apply ``` This action creates the job, provisions the nodes according the `main.tf` file content and install the specified linux distribution on it. This command will log the reserved node name in output. For example for a 1 node reservation: ``` grid5000_job.cassandra: Creating... grid5000_job.cassandra: Still creating... [10s elapsed] grid5000_job.cassandra: Creation complete after 11s [id=1814813] grid5000_deployment.my_deployment: Creating... grid5000_deployment.my_deployment: Still creating... [10s elapsed] grid5000_deployment.my_deployment: Still creating... [20s elapsed] grid5000_deployment.my_deployment: Still creating... [30s elapsed] grid5000_deployment.my_deployment: Still creating... [40s elapsed] grid5000_deployment.my_deployment: Still creating... 
[50s elapsed] grid5000_deployment.my_deployment: Still creating... [1m0s elapsed] grid5000_deployment.my_deployment: Still creating... [1m10s elapsed] grid5000_deployment.my_deployment: Still creating... [1m20s elapsed] grid5000_deployment.my_deployment: Still creating... [1m30s elapsed] grid5000_deployment.my_deployment: Still creating... [1m40s elapsed] grid5000_deployment.my_deployment: Still creating... [1m50s elapsed] grid5000_deployment.my_deployment: Still creating... [2m0s elapsed] grid5000_deployment.my_deployment: Still creating... [2m10s elapsed] grid5000_deployment.my_deployment: Creation complete after 2m12s [id=D-0bb76036-1512-429f-be99-620afa328b26] Apply complete! Resources: 2 added, 0 changed, 0 destroyed. Outputs: nodes = [ "chifflet-6.lille.grid5000.fr", ] ``` It's now possible to connect to the nodes: ``` $ ssh -A access.grid5000.fr $ ssh -A root@chifflet-6.lille.grid5000.fr Linux chifflet-6.lille.grid5000.fr 4.19.0-16-amd64 #1 SMP Debian 4.19.181-1 (2021-03-19) x86_64 Debian10-x64-base-2021060212 (Image based on Debian Buster for AMD64/EM64T) Maintained by support-staff Doc: https://www.grid5000.fr/w/Getting_Started#Deploying_nodes_with_Kadeploy root@chifflet-6:~# ``` Cleanup ------- To destroy the resources before the end of the job: ``` terraform destroy ``` If the job is stopped, simply remove the `terraform.tfstate` file: ``` rm terraform.tfstate ``` ## TODO [X] variablization of the script [X] Ansible provisionning of the nodes [X] disk initialization [X] support different cluster topologies (nodes / disks / ...) [X] cassandra installation [X] swh-storage installation [ ] journal client for mirroring [ ] monitoring by prometheus [ ] Add a tool to erase the reserved disks (useful to avoid zfs to detect the previous pools and be able to restart from scratch) ## Possible improvments [ ] Use several besteffort jobs for cassandra nodes. They can be interrupted but don't have duration restrictions. 
+[ ] Create a cassandra base image to speedup the environment initialization diff --git a/sysadmin/grid5000/cassandra/Vagrantfile b/sysadmin/grid5000/cassandra/Vagrantfile index 56dcabd..116dc98 100644 --- a/sysadmin/grid5000/cassandra/Vagrantfile +++ b/sysadmin/grid5000/cassandra/Vagrantfile @@ -1,75 +1,75 @@ # -*- mode: ruby -*- # vi: set ft=ruby : vms = { "cassandra1" => { :ip => "10.168.180.11", :memory => 2048, :cpus => 2, :type => 'cassandra', }, "cassandra2" => { :ip => "10.168.180.12", :memory => 2048, :cpus => 2, :type => 'cassandra', }, "cassandra3" => { :ip => "10.168.180.13", :memory => 2048, :cpus => 2, :type => 'cassandra', }, - "swh-storage" => { + "swh-storage1" => { :ip => "10.168.180.14", :memory => 1024, :cpus => 2, :type => 'swh-storage', }, } # Images/remote configuration $global_debian10_box = "debian10-20210517-1348" $global_debian10_box_url = "https://annex.softwareheritage.org/public/isos/libvirt/debian/swh-debian-10.9-amd64-20210517-1348.qcow2" vms.each { | vm_name, vm_props | Vagrant.configure("2") do |global_config| unless Vagrant.has_plugin?("libvirt") $stderr.puts <<-MSG vagrant-libvirt plugin is required for this. 
To install: `$ sudo apt install vagrant-libvirt MSG exit 1 end global_config.vm.define vm_name do |config| config.vm.box = $global_debian10_box config.vm.box_url = $global_debian10_box_url config.vm.box_check_update = false config.vm.hostname = vm_name config.vm.network :private_network, ip: vm_props[:ip], netmask: "255.255.0.0" config.vm.synced_folder ".", "/vagrant", type: 'nfs', nfs_version: 4 config.vm.provision :ansible do |ansible| ansible.verbose = true ansible.become = true ansible.playbook = "ansible/playbook.yml" ansible.inventory_path = "ansible/hosts.yml" end config.vm.provider :libvirt do |provider| provider.memory = vm_props[:memory] provider.cpus = vm_props[:cpus] provider.driver = 'kvm' if vm_props[:type] == "cassandra" provider.storage :file, :size => '1G' provider.storage :file, :size => '1G' provider.storage :file, :size => '1G' end end end end } diff --git a/sysadmin/grid5000/cassandra/_install_os.sh b/sysadmin/grid5000/cassandra/_install_os.sh index c4fa67c..0dc03a2 100755 --- a/sysadmin/grid5000/cassandra/_install_os.sh +++ b/sysadmin/grid5000/cassandra/_install_os.sh @@ -1,8 +1,6 @@ #!/usr/bin/env bash set -eux -INSTALL_USER=root - # Install the OS kadeploy3 -e debian10-x64-base -f "${OAR_FILE_NODES}" -k ~/.ssh/id_rsa.pub diff --git a/sysadmin/grid5000/cassandra/ansible/hosts.yml b/sysadmin/grid5000/cassandra/ansible/hosts.yml index 2004742..a530bda 100644 --- a/sysadmin/grid5000/cassandra/ansible/hosts.yml +++ b/sysadmin/grid5000/cassandra/ansible/hosts.yml @@ -1,86 +1,88 @@ # Global configuration swh-storage: hosts: - parasilo-[20:28].rennes.grid5000,fr: + parasilo-[20:28].rennes.grid5000.fr: # local vagrant hosts - swh-storage: + swh-storage1: + vars: + ansible_connection: local cassandra: hosts: dahu-[1:32].grenoble.grid5000.fr: parasilo-[1:19].rennes.grid5000.fr: # local vagrant hosts cassandra[1:9]: vars: ansible_connection: local cassandra_config_dir: /etc/cassandra cassandra_data_dir_base: /srv/cassandra cassandra_data_dir_system: 
"{{cassandra_data_dir_base}}/system" cassandra_data_dir: "{{ cassandra_data_dir_base }}/data" cassandra_commitlogs_dir: "{{ cassandra_data_dir_base }}/commitlogs" # Per cluster specificities dahu_cluster_hosts: hosts: dahu[1:32].grenoble.grid5000.fr vars: cassandra_listen_interface: enp24s0f0 parasilo_cluster_hosts: hosts: parasilo-[1:28].rennes.grid5000.fr: vars: cassandra_listen_interface: eno1 zfs_pools: commitlogs: disks: - sdf datasets: commitlogs: /srv/cassandra/commitlogs data: disks: - sdb - sdc - sdd - sde datasets: data: /srv/cassandra/data # Vagrant configuration vagrant_nodes: hosts: cassandra1: ansible_host: 10.168.180.11 ansible_user: vagrant ansible_ssh_private_key_file: .vagrant/machines/cassandra1/libvirt/private_key cassandra2: ansible_host: 10.168.180.12 ansible_user: vagrant ansible_ssh_private_key_file: .vagrant/machines/cassandra2/libvirt/private_key cassandra3: ansible_host: 10.168.180.13 ansible_user: vagrant ansible_ssh_private_key_file: .vagrant/machines/cassandra3/libvirt/private_key - swh-storage: + swh-storage1: ansible_host: 10.168.180.14 ansible_user: vagrant - ansible_ssh_private_key_file: .vagrant/machines/swh-storage/libvirt/private_key + ansible_ssh_private_key_file: .vagrant/machines/swh-storage1/libvirt/private_key # directory is named after the Vagrant machine vars: ansible_connection: ssh cassandra_listen_interface: eth1 # passed through --extra-vars on grid5000 cassandra_seed_ips: 10.168.180.11,10.168.180.12,10.168.180.13 zfs_pools: commitlogs: disks: - vdb datasets: commitlogs: /srv/cassandra/commitlogs data: disks: - vdc - vdd datasets: data: /srv/cassandra/data diff --git a/sysadmin/grid5000/cassandra/environment.cfg b/sysadmin/grid5000/cassandra/environment.cfg index 5fccee8..ad60d85 100644 --- a/sysadmin/grid5000/cassandra/environment.cfg +++ b/sysadmin/grid5000/cassandra/environment.cfg @@ -1,11 +1,16 @@ export G5K_SITE='rennes.grid5000.fr' export CASSANDRA_HOSTS="parasilo-2 parasilo-3 parasilo-4 parasilo-5" export CASSANDRA_DISKS_COUNT=5 -export STORAGE_HOSTS="parasilo-6" +export STORAGE_HOSTS="parasilo-20" export JOURNAL_CLIENT_HOSTS="" export 
MONITORING_HOSTS="" # export CASSANDRA_NB_DISK_PER_NODE=5 -export DISK_RESERVATION_DURATION=$((1 * 24)) -export NODE_RESERVATION_DURATION=10 # in hours +export DISK_RESERVATION_DURATION=$((1 * 24)) # in hours: 1 day during tests +export NODE_RESERVATION_DURATION=00:50 # OAR walltime as hh:mm (50 minutes) + + +export SSH_USER=root +# export SSH_OPTIONS="-o UserKnownHostsFile=/dev/null -o StrictHostKeyChecking=no" +export SSH_OPTIONS=""