#!/bin/bash # # Copyright (c) 2024, Barcelona Supercomputing Center (BSC) # SPDX-License-Identifier: MIT # # Based on a script provided by Xavier Martorell # Rewritten by Rodrigo Arias Mallo <rodrigo.arias@bsc.es> # Stop on first error set -e function is_module_loaded() # {{{ { lsmod | grep -wq "$1" } # }}} function check_environment() # {{{ { if ! command -v dma-ctl &> /dev/null; then echo "error: dma-ctl not found in PATH" >&2 exit 1 fi if ! command -v vivado &> /dev/null; then echo "error: vivado not found in PATH" >&2 exit 1 fi } # }}} function create_qdma_queue() # {{{ { if [ ! -d "$pcidir" ]; then echo "missing pci directory: $pcidir" >&2 exit 1 fi if [ ! -d "$pcidir/qdma" ]; then echo "missing qdma directory: $pcidir/qdma" >&2 exit 1 fi if [ ! -f "$pcidir/qdma/qmax" ]; then echo "missing qmax file: $pcidir/qdma/qmax" >&2 exit 1 fi if [ ! -r "$pcidir/qdma/qmax" ]; then echo "cannot read qmax file: $pcidir/qdma/qmax" >&2 exit 1 fi # There should be two queues local qmax=$(cat "$pcidir/qdma/qmax") if [ "$qmax" != 2 ]; then if [ -w "$pcidir/qdma/qmax" ]; then echo 2 | dd of="$pcidir/qdma/qmax" else echo 2 | sudo dd of="$pcidir/qdma/qmax" fi fi # Create the two queues if they don't exist if [ ! -c "/dev/${qdmadev}-MM-1" ]; then dma-ctl "${qdmadev}" q add mode mm idx 1 dir bi dma-ctl "${qdmadev}" q start idx 1 dir bi fi if [ ! -c "/dev/${qdmadev}-MM-0" ]; then dma-ctl "${qdmadev}" q add mode mm idx 0 dir bi dma-ctl "${qdmadev}" q start idx 0 dir bi fi # Wait for udev to process the new devices udevadm settle # Ensure we have write access. On some clusters this is automatically done # by udev rules, on others we are expect to use sudo. for f in /dev/${qdmadev}-MM-{0,1} ${pcidir}/resource{0,0_wc,2,2_wc}; do test -w "$f" || sudo chmod go+rw "$f" done sleep 2 } # }}} function do_cpu_reset() # {{{ { if [ "$model" == "hun" ]; then # UartBootEn (bit2) + system reset (bit0) dma-ctl "${qdmadev}" reg write bar 2 0x0 0x0 sleep 0.2 dma-ctl "${qdmadev}" reg write bar 2 0x0 0x1 elif [ "$model" == "ox" ]; then dma-ctl "${qdmadev}" reg write bar 2 0x0 0x0 sleep 0.2 fi } # }}} function do_cpu_release() # {{{ { if [ "$model" == "hun" ]; then # Release Ariane's reset dma-ctl "${qdmadev}" reg write bar 2 0x0 0x3 elif [ "$model" == "ox" ]; then dma-ctl "${qdmadev}" reg write bar 2 0x0 0x1 sleep 1 fi } # }}} function copy_by_dma() # {{{ { ifile="$1" address="$2" ofile="/dev/${qdmadev}-MM-1" #bs=$((8*1024*1024)) # 8 MiB bs=$((1*1024*1024)) # 1 MiB total_size=$(stat --format "%s" "$ifile") nblocks=$(( ($total_size + $bs - 1) / $bs )) skip=0 # Using just a single dd command doesn't seem to work. My hypothesis is that # the driver doesn't allow multiple writes without setting the fseek position. # So we keep copying blocks until the end of the file, one at a time. while [ "$skip" -lt "$nblocks" ]; do dst=$(($address + $skip * $bs)) dd if="$ifile" skip=$skip count=1 bs=$bs of="$ofile" seek=$dst oflag=seek_bytes status=none let skip=$skip+1 done #dma-to-device -d "$ofile" -s "$total_size" -a "$address" -f "$ifile" } # }}} function load_file_in_memory() # {{{ { file="$1" address_hex="$2" address=$(($address_hex)) total_size=$(stat --format "%s" "$file") # Previous tests... #strace -f dma-to-device -d /dev/${qdmadev}-MM-1 -a "$address" -s $((8*1024*1024)) -f "$file" #strace -f dd if="$file" bs=16M seek="${address}" oflag=seek_bytes of=/dev/${qdmadev}-MM-1 status=progress conv=sync #strace -f fpgakit/fpgadd -i "$file" -a "$address" -d /dev/${qdmadev}-MM-1 -c 1024 -s 1024 #ID=08 ./load_image.sh "$file" "$address" # Now dd seems to work fine, but I will leave this as fallback: copy_by_dma "$file" "$address" #dd if="$file" bs=8M seek="${address}" oflag=seek_bytes of=/dev/${qdmadev}-MM-1 status=none printf "loaded '%s' at 0x%x with size %d\n" "$file" "$address" "$total_size" >&2 } # }}} function do_boot_only() # {{{ { do_cpu_reset ./load_image.sh ${OSBI} $((0x80000000)) && rm -f ${OSBI} && sleep 2 && # #Release Ariane's reset dma-ctl "${qdmadev}" reg write bar 2 0x0 0x3 && sleep 10 && echo mount -o nolock -o rw -o retrans=10 10.0.2.2:/media/sda2/scratch/xavim/point /root && echo mount -o nolock -o rw -o retrans=10 192.168.0.16:/media/sda2/scratch/xavim/point /root && if [ ! -c "/dev/${qdmadev}-MM-0" ] ; then /home/tools/drivers/`/bin/hostname`/dma_ip_drivers-onic-gamma/create-queue-qdma.sh -2 fi && sleep 2 #&& # uncomment to enable eth-over-pcie #sudo ifconfig onic${onicid}s0f0 10.0.2.2 netmask 255.255.255.0 mtu 9000 up sudo ifconfig onic${onicid}s0f0 10.0.2.2 netmask 255.255.255.0 up } # }}} function do_reload_fs() # {{{ { do_cpu_reset #~xavim/LAGARTO_LINUX-4.1/./load_image.sh \ # /home/xavim/ARIANE_LINUX-3.0/recovery/fedora-fs-dx-java-cucu-0.108.raw.recovered \ # $((0x13ff00000)) && load_file_in_memory /home/xavim/ARIANE_LINUX-3.0/recovery/fedora-fs-dx-java-cucu-0.108.raw.recovered $((0x13ff00000)) sleep 1 # Load OpenSBI + kernel load_file_in_memory ${OSBI} $((0x80000000)) rm -f ${OSBI} sleep 2 do_cpu_release create_qdma_queue # uncomment to enable eth-over-pcie # sudo ifconfig onic${onicid}s0f0 10.0.2.2 netmask 255.255.255.0 mtu 9000 up } # }}} function upload_bitstream_file() # {{{ { if [ -z "$jtagserial" ]; then >&2 echo "JTAG serial required" usage fi if [ -z "$bitstream" ]; then >&2 echo "bitstream file required" usage fi script=$(mktemp vivado-XXXXXXXXXX.tcl) cat > "$script" <<EOF open_hw_manager connect_hw_server -url localhost:3121 current_hw_target "localhost:3121/xilinx_tcf/Xilinx/${jtagserial}A" open_hw_target set dev [lindex [get_hw_devices] 0] current_hw_device \$dev set_property PROGRAM.FILE ${bitstream} \$dev program_hw_devices \$dev exit EOF vivado -nolog -nojournal -mode batch -source "$script" rm "$script" killall hw_server } # }}} function unload_modules() # {{{ { drvlist="$1" # Unload modules for mod in $drvlist; do if is_module_loaded "$mod"; then sudo rmmod $mod fi done } # }}} function remove_pci_devices() # {{{ { for slot in $(lspci -mm -d 10ee: | awk '{printf "0000:%s\n",$1}'); do devdir="/sys/bus/pci/devices/$slot" if [ -d $devdir ]; then if [ -w "$devdir/remove" ]; then echo 1 | dd "of=$devdir/remove" else echo 1 | sudo dd "of=$devdir/remove" fi fi done } # }}} function rescan_pci_devices() # {{{ { if [ -w /sys/bus/pci/rescan ]; then echo 1 | dd of=/sys/bus/pci/rescan else echo 1 | sudo dd of=/sys/bus/pci/rescan fi } # }}} function load_qdma_modules() # {{{ { drv="$DMA_IP_DRIVERS/QDMA/linux-kernel/bin/qdma-pf.ko" hw_buffers="$((0x4FFE0000))" if [ ! -r "$drv" ]; then echo "error: missing $" exit 1 fi sudo insmod "$drv" "hw_buffers=$hw_buffers" sleep 4 } # }}} function select_pcidev() # {{{ { if [ -z "$pcidev" ]; then >&2 echo -e "error: missing PCI device (hint: lspci -d 10ee:902f)" usage fi # Ensure it is ok local matches=$(lspci -s "$pcidev") if [ -z "$matches" ]; then >&2 echo "no match for PCI device '$pcidev'" exit 1 fi local n="$(echo "$matches" | wc -l)" if [ "$n" -gt 1 ]; then >&2 echo "multiple matches for PCI device '$pcidev'" exit 1 fi # Fill the PCI device with the domain local fulldev=$(lspci -s "$pcidev" -D | cut -d' ' -f1) pcidir="/sys/bus/pci/devices/$fulldev" if [ ! -d "$pcidir" ]; then >&2 echo "cannot find PCI dir: $pcidir" exit 1 fi # Set the PCI device to the full device pcidev="$fulldev" # Find slot slot=$(lspci -s "$pcidev" -vm | grep PhySlot | cut -f2) if [ -z "$slot" ]; then >&2 echo "cannot find physical slot for PCI '$pcidev'" exit 1 fi local devid=$(echo "$pcidev" | cut -d: -f2- | tr -d ':.') qdmadev="qdma${devid}" } # }}} function preload_hook() #{{{ { case "$hostname" in cucu) unload_modules "xocl xclmgmt qdma_pf xdma" # qdma_vf not removable remove_pci_devices ;; fpgan*) ;; *) echo "hostname $hostname not known" exit 1 ;; esac } #}}} function postload_hook() #{{{ { rescan_pci_devices case "$hostname" in cucu) unload_modules "qdma_pf xdma" # qdma_vf not removable remove_pci_devices load_qdma_modules rescan_pci_devices ;; fpgan*) ;; *) echo "hostname $hostname not known" exit 1 ;; esac create_qdma_queue } #}}} function load_bitstream() # {{{ { preload_hook upload_bitstream_file postload_hook } # }}} bitstream= bootloader= kernel= initrd= rootfs= resetcpu= verbose= pcidev= model=ox # Internal slot= pcidir= qdmadev= bootloader_addr="${FPGA_BOOTLOADER_ADDR:-0x80000000}" kernel_addr="${FPGA_KERNEL_ADDR:-0x84000000}" initrd_addr="${FPGA_INITRD_ADDR:-0x8c300000}" rootfs_addr="${FPGA_ROOTFS_ADDR:-0x140000000}" hostname="${hostname:-$(hostname)}" echo "hostname=$hostname" function usage() { echo "" >&2 echo "Usage: $0 [-p pcidev] [-v] [-w bitstream] [-j serial] [-b bootloader] [-k kernel] [-i initrd]" >&2 echo "" >&2 echo "First writes the bitstream if given. Then loads the rest of files" >&2 echo "into memory and restarts the CPU." >&2 echo "" >&2 echo "Options" >&2 echo " -p pcidev Select PCI device (same format as lspci -s)." >&2 echo " Read from \$FPGACTL_PCIDEV if not given." >&2 echo " -w bitstream Write the bitstream file to the FPGA" >&2 echo " -j serial JTAG serial (can be found by lsusb -v)" >&2 echo " Read from \$FPGACTL_SERIAL if not given." >&2 echo " -b bootloader Load the bootloader file in $bootloader_addr" >&2 echo " -k kernel Load the kernel file in $kernel_addr" >&2 echo " -i initrd Load the initrd file in $initrd_addr" >&2 echo " -r rootfs Load the rootfs file in $rootfs_addr" >&2 echo " -m model CPU model: Either 'hun' or 'ox' (default ox)" >&2 echo " -v Be verbose" >&2 echo "" >&2 exit 1 } while getopts "hvw:b:k:i:r:p:j:m:" opt; do case "${opt}" in v) verbose=1 ;; w) bitstream="${OPTARG}" ;; b) bootloader="${OPTARG}"; resetcpu=1 ;; k) kernel="${OPTARG}"; resetcpu=1 ;; i) initrd="${OPTARG}"; resetcpu=1 ;; r) rootfs="${OPTARG}"; resetcpu=1 ;; p) pcidev="${OPTARG}" ;; j) jtagserial="${OPTARG}" ;; m) model="${OPTARG}" ;; h) usage ;; *) usage ;; esac done jtagserial="${jtagserial:-$FPGACTL_SERIAL}" pcidev="${pcidev:-$FPGACTL_PCIDEV}" test "$verbose" && set -x check_environment select_pcidev test "$bitstream" && load_bitstream "$bitstream" test "$resetcpu" && do_cpu_reset test "$bootloader" && load_file_in_memory "$bootloader" $bootloader_addr test "$kernel" && load_file_in_memory "$kernel" $kernel_addr test "$initrd" && load_file_in_memory "$initrd" $initrd_addr test "$rootfs" && load_file_in_memory "$rootfs" $rootfs_addr test "$resetcpu" && do_cpu_release exit 0 # vim:ts=2:sw=2:ai:foldmethod=marker:foldlevel=0: