-
Notifications
You must be signed in to change notification settings - Fork 15
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Update Moneo Exporter for MI300 (#81)
* update moneo for mi300 * fix comments
- Loading branch information
Showing
4 changed files
with
110 additions
and
32 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,31 @@ | ||
# Moneo exporter image for AMD GPUs, built on the ROCm development image.
FROM rocm/dev-ubuntu-22.04:6.1.1

# Metadata
LABEL maintainer="Moneo"

# ROCm release this image is built against; exported to the container
# environment. Keep it in sync with the tag on the FROM line above.
ENV ROCM_VERSION=6.1.1

# Build-time only: stops apt/dpkg from prompting during the RUN steps below
# without leaving the setting in the running container's environment.
ARG DEBIAN_FRONTEND=noninteractive

# Work directory setup
WORKDIR /root/Moneo

# OS packages and Python tooling. This layer comes before the source COPY so
# that editing project files does not force a reinstall of every package.
# `ln -sf` repoints /usr/bin/python3 at python3.10 whether or not the link
# already exists; `--no-cache-dir` keeps pip's download cache out of the layer.
# NOTE(review): the apt package lists are intentionally left in place because
# install/amd.sh (not shown here) may install further packages without running
# `apt-get update` itself - confirm, then add `rm -rf /var/lib/apt/lists/*`.
RUN apt-get update -y && apt-get install -y --no-install-recommends \
        cmake \
        curl \
        git \
        ibverbs-utils \
        libcap2-bin \
        libgomp1 \
        numactl \
        python3-pip \
        python3.10 \
        sudo \
        systemd \
        wget && \
    ln -sf python3.10 /usr/bin/python3 && \
    python3 -m pip install --no-cache-dir --upgrade pip && \
    python3 -m pip install --no-cache-dir prometheus_client psutil

# Project sources (build context -> /root/Moneo)
COPY . .

# RDC installation. The build already runs as root, so the script is invoked
# directly; this also lets DEBIAN_FRONTEND reach it, which `sudo` would have
# stripped when resetting the environment. The sudo package stays installed
# above in case the script calls it internally.
WORKDIR /root/Moneo/src/worker
RUN bash install/amd.sh

# Entrypoint script, placed in the worker directory
COPY dockerfile/moneo-exporter-amd_entrypoint.sh .
RUN chmod +x moneo-exporter-amd_entrypoint.sh

# Default command: run the entrypoint script with bash
CMD ["/bin/bash", "moneo-exporter-amd_entrypoint.sh"]
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,27 @@ | ||
#!/bin/bash
# Entrypoint for the Moneo AMD exporter container.
# Starts the AMD RDC daemon and the AMD, network and node exporters as
# background jobs, then exits with the status of whichever job exits first.
set -e

# Forwards a termination request to every background job, waits for them to
# finish, and exits with the conventional 128+signal status.
# Without a handler, a shell running as the container's PID 1 ignores SIGTERM,
# so `docker stop` would stall until the runtime falls back to SIGKILL.
#   $1 - numeric value of the received signal (used for the exit status)
forward_signal() {
    # Restore default handling so a repeated signal does not re-enter here.
    trap - TERM INT
    local pids
    pids=$(jobs -p)
    if [ -n "$pids" ]; then
        # Word splitting is intended: one PID per argument.
        # shellcheck disable=SC2086
        kill $pids 2>/dev/null || true
    fi
    wait || true
    exit $((128 + $1))
}
trap 'forward_signal 15' TERM
trap 'forward_signal 2' INT

# Stops previous instances of AMD RDC Daemon and Exporter
bash shutdown.sh

# Launches AMD RDC Daemon, detached from this script's stdin/stdout/stderr
nohup /opt/rocm/bin/rdcd -u </dev/null >/dev/null 2>&1 &

# Initiates AMD and Network Exporters
echo "Starting AMD and Network Exporters"

# Starts AMD Exporter
python3 exporters/amd_exporter.py &
echo "AMD Exporter Started!"

# Starts Network Exporter with specified InfiniBand sysfs path
# NOTE(review): "inifiband" looks like a misspelling of "infiniband", but the
# flag has to match the argument name defined in net_exporter.py - confirm
# there before renaming it.
python3 exporters/net_exporter.py --inifiband_sysfs=/hostsys/class/infiniband &
echo "Network Exporter Started!"

# Starts Node Exporter
python3 exporters/node_exporter.py &
echo "Node Exporter Started!"

# Waits for any background job to exit and propagates its exit status.
# The status is captured explicitly because, under `set -e`, a failing
# `wait -n` would otherwise end the script before a following `exit` line.
status=0
wait -n || status=$?
exit "$status"
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters