Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 3 additions & 1 deletion .github/workflows/test-gpu-rust.yml
Original file line number Diff line number Diff line change
Expand Up @@ -60,10 +60,12 @@ jobs:
# internal buck test behavior.
# The CI profile is configured in .config/nextest.toml
# The exclude filter is for packages that don't build in GitHub Actions yet.
# * monarch_messages: monarch/target/debug/deps/monarch_messages-...:
# * controller - Old system actor tests that we are trying to deprecate.
# * monarch_messages - torch-sys-cuda: monarch/target/debug/deps/monarch_messages-...:
# /lib64/libm.so.6: version `GLIBC_2.29' not found
# (required by /meta-pytorch/monarch/libtorch/lib/libtorch_cpu.so)
cargo nextest run --workspace --profile ci \
--exclude controller \
--exclude monarch_messages \
--exclude monarch_tensor_worker \
--exclude monarch_simulator_lib \
Expand Down
20 changes: 14 additions & 6 deletions controller/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -665,7 +665,9 @@ mod tests {

use super::*;

#[tokio::test]
#[async_timed_test(timeout_secs = 30)]
// TODO: the worker message count is 0 instead of 1, or the test sometimes times out.
#[cfg_attr(not(fbcode_build), ignore)]
async fn basic_controller() {
// TODO: Add a proper multiworker test
let proc = Proc::local();
Expand Down Expand Up @@ -856,6 +858,7 @@ mod tests {
);
}

// Can't use async_timed_test because this test relies on tokio::time::pause and tokio::time::advance.
#[tokio::test]
async fn worker_timeout() {
tokio::time::pause();
Expand Down Expand Up @@ -976,6 +979,7 @@ mod tests {
);
}

// Can't use async_timed_test because this test relies on tokio::time::pause and tokio::time::advance.
#[tokio::test]
async fn test_failure_on_worker_timeout() {
tokio::time::pause();
Expand Down Expand Up @@ -1113,7 +1117,9 @@ mod tests {
);
}

#[tokio::test]
#[async_timed_test(timeout_secs = 30)]
// TODO: this test sometimes times out.
#[cfg_attr(not(fbcode_build), ignore)]
async fn failure_propagation() {
// Serve a system.
let server_handle = System::serve(
Expand Down Expand Up @@ -1342,7 +1348,7 @@ mod tests {
)
}

#[tokio::test]
#[async_timed_test(timeout_secs = 30)]
async fn test_eager_failure_reporting() {
// Serve a system.
let server_handle = System::serve(
Expand Down Expand Up @@ -1515,7 +1521,7 @@ mod tests {
assert_eq!(successes, 1);
}

#[tokio::test]
#[async_timed_test(timeout_secs = 30)]
async fn test_bootstrap() {
let server_handle = System::serve(
ChannelAddr::any(ChannelTransport::Local),
Expand Down Expand Up @@ -1592,7 +1598,8 @@ mod tests {
)
}

#[tokio::test]
#[async_timed_test(timeout_secs = 30)]
#[cfg_attr(not(fbcode_build), ignore)]
async fn test_sim_supervision_failure() {
// Start system actor.
simnet::start();
Expand Down Expand Up @@ -1702,7 +1709,8 @@ mod tests {
let records = simnet::simnet_handle().unwrap().close().await.unwrap();
eprintln!("{}", serde_json::to_string_pretty(&records).unwrap());
}
#[tokio::test]

#[async_timed_test(timeout_secs = 30)]
async fn test_supervision_failure() {
// Start system actor.
let timeout: Duration = Duration::from_secs(6);
Expand Down
Loading