mirror of https://github.com/exo-explore/exo.git
synced 2026-02-20 07:46:42 -05:00

Compare commits
4 Commits: feat/bug-r...test-scree
| Author | SHA1 | Date |
|---|---|---|
| | 42e1e7322b | |
| | aa3f106fb9 | |
| | 2e29605194 | |
| | cacb456cb2 | |
Cargo.lock (generated, 13 changes)
@@ -890,7 +890,7 @@ dependencies = [
 "delegate",
 "env_logger",
 "extend",
-"futures",
+"futures-lite",
 "libp2p",
 "log",
 "networking",
@@ -914,6 +914,12 @@ dependencies = [
 "syn 2.0.111",
 ]

+[[package]]
+name = "fastrand"
+version = "2.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "37909eebbb50d72f9059c3b6d82c0463f2ff062c9e95845c43a6c9c0355411be"
+
 [[package]]
 name = "ff"
 version = "0.13.1"
@@ -1022,7 +1028,10 @@ version = "2.6.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "f78e10609fe0e0b3f4157ffab1876319b5b0db102a2c60dc4626306dc46b44ad"
 dependencies = [
+"fastrand",
 "futures-core",
+"futures-io",
+"parking",
 "pin-project-lite",
 ]

@@ -2753,7 +2762,7 @@ dependencies = [
 "delegate",
 "either",
 "extend",
-"futures",
+"futures-lite",
 "futures-timer",
 "keccak-const",
 "libp2p",

@@ -29,14 +29,13 @@ util = { path = "rust/util" }
 # Macro dependecies
 extend = "1.2"
 delegate = "0.13"
-pin-project = "1"

 # Utility dependencies
 keccak-const = "0.2"

 # Async dependencies
 tokio = "1.46"
-futures = "0.3"
+futures-lite = "2.6.1"
 futures-timer = "3.0"

 # Data structures
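
A note on the `futures` → `futures-lite` swap that recurs through the hunks below: both crates re-export the same `AsyncRead`/`AsyncWrite` traits from the shared `futures-io` crate, so trait-bound code compiles unchanged after the import rename; only a few extension-trait call sites differ, as the later hunks show. A minimal sketch, assuming only the `futures-lite` dependency declared above (not part of the diff):

```rust
// Sketch: the I/O traits are the same items under either crate, so a bound
// like this is unaffected by the dependency swap.
use futures_lite::{AsyncRead, AsyncWrite}; // was: use futures::{AsyncRead, AsyncWrite};

fn assert_io<T: AsyncRead + AsyncWrite>(_t: &T) {}

fn main() {}
```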

@@ -20,6 +20,7 @@ from harness import (
     instance_id_from_instance,
     nodes_used_in_instance,
     resolve_model_short_id,
+    run_planning_phase,
     settle_and_fetch_placements,
     wait_for_instance_gone,
     wait_for_instance_ready,
@@ -962,6 +963,21 @@ Examples:

     selected.sort(key=_placement_sort_key)
     preview = selected[0]

+    settle_deadline = (
+        time.monotonic() + args.settle_timeout if args.settle_timeout > 0 else None
+    )
+
+    print("Planning phase: checking downloads...", file=log)
+    run_planning_phase(
+        exo,
+        full_model_id,
+        preview,
+        args.danger_delete_downloads,
+        args.timeout,
+        settle_deadline,
+    )
+
     instance = preview["instance"]
     instance_id = instance_id_from_instance(instance)
     sharding = str(preview["sharding"])

@@ -35,6 +35,7 @@ from harness import (
     instance_id_from_instance,
     nodes_used_in_instance,
     resolve_model_short_id,
+    run_planning_phase,
     settle_and_fetch_placements,
     wait_for_instance_gone,
     wait_for_instance_ready,
@@ -332,6 +333,20 @@ def main() -> int:
     if args.dry_run:
         return 0

+    settle_deadline = (
+        time.monotonic() + args.settle_timeout if args.settle_timeout > 0 else None
+    )
+
+    logger.info("Planning phase: checking downloads...")
+    run_planning_phase(
+        client,
+        full_model_id,
+        selected[0],
+        args.danger_delete_downloads,
+        args.timeout,
+        settle_deadline,
+    )
+
     all_rows: list[dict[str, Any]] = []

     for preview in selected:
bench/harness.py (150 changes)
@@ -282,6 +282,151 @@ def settle_and_fetch_placements(
     return selected


+def run_planning_phase(
+    client: ExoClient,
+    full_model_id: str,
+    preview: dict[str, Any],
+    danger_delete: bool,
+    timeout: float,
+    settle_deadline: float | None,
+) -> None:
+    """Check disk space and ensure model is downloaded before benchmarking."""
+    # Get model size from /models
+    models = client.request_json("GET", "/models") or {}
+    model_bytes = 0
+    for m in models.get("data", []):
+        if m.get("hugging_face_id") == full_model_id:
+            model_bytes = m.get("storage_size_megabytes", 0) * 1024 * 1024
+            break
+
+    if not model_bytes:
+        logger.warning(
+            f"Could not determine size for {full_model_id}, skipping disk check"
+        )
+        return
+
+    # Get nodes from preview
+    inner = unwrap_instance(preview["instance"])
+    node_ids = list(inner["shardAssignments"]["nodeToRunner"].keys())
+    runner_to_shard = inner["shardAssignments"]["runnerToShard"]
+
+    state = client.request_json("GET", "/state")
+    downloads = state.get("downloads", {})
+    node_disk = state.get("nodeDisk", {})
+
+    for node_id in node_ids:
+        node_downloads = downloads.get(node_id, [])
+
+        # Check if model already downloaded on this node
+        already_downloaded = any(
+            "DownloadCompleted" in p
+            and unwrap_instance(p["DownloadCompleted"]["shardMetadata"])["modelCard"][
+                "modelId"
+            ]
+            == full_model_id
+            for p in node_downloads
+        )
+        if already_downloaded:
+            continue
+
+        # Wait for disk info if settle_deadline is set
+        disk_info = node_disk.get(node_id, {})
+        backoff = _SETTLE_INITIAL_BACKOFF_S
+        while not disk_info and settle_deadline and time.monotonic() < settle_deadline:
+            remaining = settle_deadline - time.monotonic()
+            logger.info(
+                f"Waiting for disk info on {node_id} ({remaining:.0f}s remaining)..."
+            )
+            time.sleep(min(backoff, remaining))
+            backoff = min(backoff * _SETTLE_BACKOFF_MULTIPLIER, _SETTLE_MAX_BACKOFF_S)
+            state = client.request_json("GET", "/state")
+            node_disk = state.get("nodeDisk", {})
+            disk_info = node_disk.get(node_id, {})
+
+        if not disk_info:
+            logger.warning(f"No disk info for {node_id}, skipping space check")
+            continue
+
+        avail = disk_info.get("available", {}).get("inBytes", 0)
+        if avail >= model_bytes:
+            continue
+
+        if not danger_delete:
+            raise RuntimeError(
+                f"Insufficient disk on {node_id}: need {model_bytes // (1024**3)}GB, "
+                f"have {avail // (1024**3)}GB. Use --danger-delete-downloads to free space."
+            )
+
+        # Delete from smallest to largest
+        completed = [
+            (
+                unwrap_instance(p["DownloadCompleted"]["shardMetadata"])["modelCard"][
+                    "modelId"
+                ],
+                p["DownloadCompleted"]["totalBytes"]["inBytes"],
+            )
+            for p in node_downloads
+            if "DownloadCompleted" in p
+        ]
+        for del_model, size in sorted(completed, key=lambda x: x[1]):
+            logger.info(f"Deleting {del_model} from {node_id} ({size // (1024**2)}MB)")
+            client.request_json("DELETE", f"/download/{node_id}/{del_model}")
+            avail += size
+            if avail >= model_bytes:
+                break
+
+        if avail < model_bytes:
+            raise RuntimeError(f"Could not free enough space on {node_id}")
+
+    # Start downloads (idempotent)
+    for node_id in node_ids:
+        runner_id = inner["shardAssignments"]["nodeToRunner"][node_id]
+        shard = runner_to_shard[runner_id]
+        client.request_json(
+            "POST",
+            "/download/start",
+            body={
+                "targetNodeId": node_id,
+                "shardMetadata": shard,
+            },
+        )
+        logger.info(f"Started download on {node_id}")
+
+    # Wait for downloads
+    start = time.time()
+    while time.time() - start < timeout:
+        state = client.request_json("GET", "/state")
+        downloads = state.get("downloads", {})
+        all_done = True
+        for node_id in node_ids:
+            done = any(
+                "DownloadCompleted" in p
+                and unwrap_instance(p["DownloadCompleted"]["shardMetadata"])[
+                    "modelCard"
+                ]["modelId"]
+                == full_model_id
+                for p in downloads.get(node_id, [])
+            )
+            failed = [
+                p["DownloadFailed"]["errorMessage"]
+                for p in downloads.get(node_id, [])
+                if "DownloadFailed" in p
+                and unwrap_instance(p["DownloadFailed"]["shardMetadata"])["modelCard"][
+                    "modelId"
+                ]
+                == full_model_id
+            ]
+            if failed:
+                raise RuntimeError(f"Download failed on {node_id}: {failed[0]}")
+            if not done:
+                all_done = False
+        if all_done:
+            return
+        time.sleep(1)
+
+    raise TimeoutError("Downloads did not complete in time")
+
+
 def add_common_instance_args(ap: argparse.ArgumentParser) -> None:
     ap.add_argument("--host", default=os.environ.get("EXO_HOST", "localhost"))
     ap.add_argument(
@@ -325,3 +470,8 @@ def add_common_instance_args(ap: argparse.ArgumentParser) -> None:
         default=0,
         help="Max seconds to wait for the cluster to produce valid placements (0 = try once).",
     )
+    ap.add_argument(
+        "--danger-delete-downloads",
+        action="store_true",
+        help="Delete existing models from smallest to largest to make room for benchmark model.",
+    )
@@ -74,7 +74,6 @@
   perSystem =
     { config, self', inputs', pkgs, lib, system, ... }:
     let
-      fenixToolchain = inputs'.fenix.packages.complete;
       # Use pinned nixpkgs for swift-format (swift is broken on x86_64-linux in newer nixpkgs)
       pkgsSwift = import inputs.nixpkgs-swift { inherit system; };
     in

@@ -1,2 +0,0 @@
-# we can manually exclude false-positive lint errors for dual packages (if in dependencies)
-#allowed-duplicate-crates = ["hashbrown"]
@@ -27,7 +27,7 @@ networking = { workspace = true }
 # interop
 pyo3 = { version = "0.27.2", features = [
   # "abi3-py313", # tells pyo3 (and maturin) to build using the stable ABI with minimum Python version 3.13
-  "nightly", # enables better-supported GIL integration
+  # "nightly", # enables better-supported GIL integration
   "experimental-async", # async support in #[pyfunction] & #[pymethods]
   #"experimental-inspect", # inspection of generated binary => easier to automate type-hint generation
   #"py-clone", # adding Clone-ing of `Py<T>` without GIL (may cause panics - remove if panics happen)
@@ -45,11 +45,10 @@ pyo3-log = "0.13.2"
 # macro dependencies
 extend = { workspace = true }
 delegate = { workspace = true }
-pin-project = { workspace = true }

 # async runtime
 tokio = { workspace = true, features = ["full", "tracing"] }
-futures = { workspace = true }
+futures-lite = { workspace = true }

 # utility dependencies
 util = { workspace = true }
@@ -60,3 +59,4 @@ env_logger = "0.11"

 # Networking
 libp2p = { workspace = true, features = ["full"] }
+pin-project = "1.1.10"
@@ -2,7 +2,6 @@
 //!

 use pin_project::pin_project;
-use pyo3::marker::Ungil;
 use pyo3::prelude::*;
 use std::{
     future::Future,
@@ -26,8 +25,8 @@ where

 impl<F> Future for AllowThreads<F>
 where
-    F: Future + Ungil,
-    F::Output: Ungil,
+    F: Future + Send,
+    F::Output: Send,
 {
     type Output = F::Output;

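
Context for the bound change: pyo3's `Ungil` marker is only a true auto trait under the crate's `nightly` feature, which the Cargo.toml hunk above disables; on stable, pyo3 blanket-implements `Ungil` for all `Send` types, so `Send` expresses the same constraint. A minimal sketch of the wrapper's assumed shape (only the impl block appears in this hunk, so the struct here is illustrative):

```rust
use std::future::Future;
use std::pin::Pin;
use std::task::{Context, Poll};

use pin_project::pin_project;

// Assumed shape for illustration; the real type presumably releases the GIL
// around the inner poll, while this sketch merely delegates.
#[pin_project]
struct AllowThreads<F>(#[pin] F);

impl<F> Future for AllowThreads<F>
where
    F: Future + Send,  // was: F: Future + Ungil
    F::Output: Send,   // was: F::Output: Ungil
{
    type Output = F::Output;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        self.project().0.poll(cx)
    }
}

fn main() {}
```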
@@ -4,25 +4,12 @@
 //!
 //!

-// enable Rust-unstable features for convenience
-#![feature(trait_alias)]
-#![feature(tuple_trait)]
-#![feature(unboxed_closures)]
-// #![feature(stmt_expr_attributes)]
-// #![feature(assert_matches)]
-// #![feature(async_fn_in_dyn_trait)]
-// #![feature(async_for_loop)]
-// #![feature(auto_traits)]
-// #![feature(negative_impls)]
-
-extern crate core;
 mod allow_threading;
-pub(crate) mod networking;
-pub(crate) mod pylibp2p;
+mod ident;
+mod networking;

+use crate::ident::ident_submodule;
 use crate::networking::networking_submodule;
-use crate::pylibp2p::ident::ident_submodule;
-use crate::pylibp2p::multiaddr::multiaddr_submodule;
 use pyo3::prelude::PyModule;
 use pyo3::{Bound, PyResult, pyclass, pymodule};
 use pyo3_stub_gen::define_stub_info_gatherer;
@@ -32,14 +19,6 @@ pub(crate) mod r#const {
     pub const MPSC_CHANNEL_SIZE: usize = 1024;
 }

-/// Namespace for all the type/trait aliases used by this crate.
-pub(crate) mod alias {
-    use std::marker::Tuple;
-
-    pub trait SendFn<Args: Tuple + Send + 'static, Output> =
-        Fn<Args, Output = Output> + Send + 'static;
-}
-
 /// Namespace for crate-wide extension traits/methods
 pub(crate) mod ext {
     use crate::allow_threading::AllowThreads;
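
The deleted `alias` module relied on the nightly `trait_alias`, `tuple_trait`, and `unboxed_closures` features removed above. If such an alias were still needed on a stable toolchain, the usual substitute is a named trait with a blanket impl, written once per arity; a hypothetical sketch, not what the commit adds (the commit simply drops the unused alias):

```rust
// Hypothetical stable-Rust stand-in for the removed nightly-only alias.
// Stable Rust cannot abstract over argument tuples, hence one trait per arity.
pub trait SendFn1<A, Out>: Fn(A) -> Out + Send + 'static {}

impl<T, A, Out> SendFn1<A, Out> for T where T: Fn(A) -> Out + Send + 'static {}

fn main() {
    fn takes_send_fn(f: impl SendFn1<u32, u32>) -> u32 {
        f(1)
    }
    assert_eq!(takes_send_fn(|x| x + 1), 2);
}
```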
@@ -180,7 +159,6 @@ fn main_module(m: &Bound<'_, PyModule>) -> PyResult<()> {
     // work with maturin, where the types generate correctly, in the right folder, without
     // too many importing issues...
     ident_submodule(m)?;
-    multiaddr_submodule(m)?;
     networking_submodule(m)?;

     // top-level constructs

@@ -8,8 +8,8 @@
 use crate::r#const::MPSC_CHANNEL_SIZE;
 use crate::ext::{ByteArrayExt as _, FutureExt, PyErrExt as _};
 use crate::ext::{ResultExt as _, TokioMpscReceiverExt as _, TokioMpscSenderExt as _};
+use crate::ident::{PyKeypair, PyPeerId};
 use crate::pyclass;
-use crate::pylibp2p::ident::{PyKeypair, PyPeerId};
 use libp2p::futures::StreamExt as _;
 use libp2p::gossipsub;
 use libp2p::gossipsub::{IdentTopic, Message, MessageId, PublishError};

@@ -1,8 +0,0 @@
-//! A module for exposing Rust's libp2p datatypes over Pyo3
-//!
-//! TODO: right now we are coupled to libp2p's identity, but eventually we want to create our own
-//! independent identity type of some kind or another. This may require handshaking.
-//!
-
-pub mod ident;
-pub mod multiaddr;
@@ -1,81 +0,0 @@
-use crate::ext::ResultExt as _;
-use libp2p::Multiaddr;
-use pyo3::prelude::{PyBytesMethods as _, PyModule, PyModuleMethods as _};
-use pyo3::types::PyBytes;
-use pyo3::{Bound, PyResult, Python, pyclass, pymethods};
-use pyo3_stub_gen::derive::{gen_stub_pyclass, gen_stub_pymethods};
-use std::str::FromStr as _;
-
-/// Representation of a Multiaddr.
-#[gen_stub_pyclass]
-#[pyclass(name = "Multiaddr", frozen)]
-#[derive(Debug, Clone)]
-#[repr(transparent)]
-pub struct PyMultiaddr(pub Multiaddr);
-
-#[gen_stub_pymethods]
-#[pymethods]
-#[allow(clippy::needless_pass_by_value)]
-impl PyMultiaddr {
-    /// Create a new, empty multiaddress.
-    #[staticmethod]
-    fn empty() -> Self {
-        Self(Multiaddr::empty())
-    }
-
-    /// Create a new, empty multiaddress with the given capacity.
-    #[staticmethod]
-    fn with_capacity(n: usize) -> Self {
-        Self(Multiaddr::with_capacity(n))
-    }
-
-    /// Parse a `Multiaddr` value from its byte slice representation.
-    #[staticmethod]
-    fn from_bytes(bytes: Bound<'_, PyBytes>) -> PyResult<Self> {
-        let bytes = Vec::from(bytes.as_bytes());
-        Ok(Self(Multiaddr::try_from(bytes).pyerr()?))
-    }
-
-    /// Parse a `Multiaddr` value from its string representation.
-    #[staticmethod]
-    fn from_string(string: String) -> PyResult<Self> {
-        Ok(Self(Multiaddr::from_str(&string).pyerr()?))
-    }
-
-    /// Return the length in bytes of this multiaddress.
-    fn len(&self) -> usize {
-        self.0.len()
-    }
-
-    /// Returns true if the length of this multiaddress is 0.
-    fn is_empty(&self) -> bool {
-        self.0.is_empty()
-    }
-
-    /// Return a copy of this [`Multiaddr`]'s byte representation.
-    fn to_bytes<'py>(&self, py: Python<'py>) -> Bound<'py, PyBytes> {
-        let bytes = self.0.to_vec();
-        PyBytes::new(py, &bytes)
-    }
-
-    /// Convert a Multiaddr to a string.
-    fn to_string(&self) -> String {
-        self.0.to_string()
-    }
-
-    #[gen_stub(skip)]
-    fn __repr__(&self) -> String {
-        format!("Multiaddr({})", self.0)
-    }
-
-    #[gen_stub(skip)]
-    fn __str__(&self) -> String {
-        self.to_string()
-    }
-}
-
-pub fn multiaddr_submodule(m: &Bound<'_, PyModule>) -> PyResult<()> {
-    m.add_class::<PyMultiaddr>()?;
-
-    Ok(())
-}
@@ -22,7 +22,7 @@ delegate = { workspace = true }

 # async
 tokio = { workspace = true, features = ["full"] }
-futures = { workspace = true }
+futures-lite = { workspace = true }
 futures-timer = { workspace = true }

 # utility dependencies
@@ -1,4 +1,4 @@
-use futures::stream::StreamExt as _;
+use futures_lite::StreamExt;
 use libp2p::{gossipsub, identity, swarm::SwarmEvent};
 use networking::{discovery, swarm};
 use tokio::{io, io::AsyncBufReadExt as _, select};
@@ -38,19 +38,19 @@ async fn main() {
                     println!("Publish error: {e:?}");
                 }
             }
-            event = swarm.select_next_some() => match event {
+            event = swarm.next() => match event {
                 // on gossipsub incoming
-                SwarmEvent::Behaviour(swarm::BehaviourEvent::Gossipsub(gossipsub::Event::Message {
+                Some(SwarmEvent::Behaviour(swarm::BehaviourEvent::Gossipsub(gossipsub::Event::Message {
                     propagation_source: peer_id,
                     message_id: id,
                     message,
-                })) => println!(
+                }))) => println!(
                     "\n\nGot message: '{}' with id: {id} from peer: {peer_id}\n\n",
                     String::from_utf8_lossy(&message.data),
                 ),

                 // on discovery
-                SwarmEvent::Behaviour(swarm::BehaviourEvent::Discovery(e)) => match e {
+                Some(SwarmEvent::Behaviour(swarm::BehaviourEvent::Discovery(e)) )=> match e {
                     discovery::Event::ConnectionEstablished {
                         peer_id, connection_id, remote_ip, remote_tcp_port
                     } => {
@@ -64,7 +64,7 @@ async fn main() {
                 }

                 // ignore outgoing errors: those are normal
-                e@SwarmEvent::OutgoingConnectionError { .. } => { log::debug!("Outgoing connection error: {e:?}"); }
+                e@Some(SwarmEvent::OutgoingConnectionError { .. }) => { log::debug!("Outgoing connection error: {e:?}"); }

                 // otherwise log any other event
                 e => { log::info!("Other event {e:?}"); }
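
The `select_next_some()` → `next()` change above is an API difference, not a rename: futures' `select_next_some()` requires a `FusedStream` and yields the item directly, while futures-lite's `StreamExt::next()` yields `Option<Item>`. Since a libp2p `Swarm` stream never terminates, the new match arms wrap each pattern in `Some(..)` and let the catch-all arm absorb a hypothetical `None`. A standalone sketch of the same pattern (illustrative, not from the diff):

```rust
use futures_lite::StreamExt;

fn main() {
    futures_lite::future::block_on(async {
        let mut events = futures_lite::stream::iter(["connected", "message"]);
        // next() yields Option<Item>, hence the Some(..) wrappers in the
        // match arms above; None would signal stream termination.
        while let Some(event) = events.next().await {
            println!("event: {event}");
        }
    });
}
```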

@@ -1,127 +0,0 @@
-// Copyright 2018 Parity Technologies (UK) Ltd.
-//
-// Permission is hereby granted, free of charge, to any person obtaining a
-// copy of this software and associated documentation files (the "Software"),
-// to deal in the Software without restriction, including without limitation
-// the rights to use, copy, modify, merge, publish, distribute, sublicense,
-// and/or sell copies of the Software, and to permit persons to whom the
-// Software is furnished to do so, subject to the following conditions:
-//
-// The above copyright notice and this permission notice shall be included in
-// all copies or substantial portions of the Software.
-//
-// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
-// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
-// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
-// DEALINGS IN THE SOFTWARE.
-
-use futures::stream::StreamExt;
-use libp2p::{
-    gossipsub, mdns, noise,
-    swarm::{NetworkBehaviour, SwarmEvent},
-    tcp, yamux,
-};
-use std::error::Error;
-use std::time::Duration;
-use tokio::{io, io::AsyncBufReadExt, select};
-use tracing_subscriber::EnvFilter;
-
-// We create a custom network behaviour that combines Gossipsub and Mdns.
-#[derive(NetworkBehaviour)]
-struct MyBehaviour {
-    gossipsub: gossipsub::Behaviour,
-    mdns: mdns::tokio::Behaviour,
-}
-
-#[tokio::main]
-async fn main() -> Result<(), Box<dyn Error>> {
-    let _ = tracing_subscriber::fmt()
-        .with_env_filter(EnvFilter::from_default_env())
-        .try_init();
-
-    let mut swarm = libp2p::SwarmBuilder::with_new_identity()
-        .with_tokio()
-        .with_tcp(
-            tcp::Config::default(),
-            noise::Config::new,
-            yamux::Config::default,
-        )?
-        .with_behaviour(|key| {
-            // Set a custom gossipsub configuration
-            let gossipsub_config = gossipsub::ConfigBuilder::default()
-                .heartbeat_interval(Duration::from_secs(10))
-                .validation_mode(gossipsub::ValidationMode::Strict) // This sets the kind of message validation. The default is Strict (enforce message signing)
-                .build()
-                .map_err(io::Error::other)?; // Temporary hack because `build` does not return a proper `std::error::Error`.
-
-            // build a gossipsub network behaviour
-            let gossipsub = gossipsub::Behaviour::new(
-                gossipsub::MessageAuthenticity::Signed(key.clone()),
-                gossipsub_config,
-            )?;
-
-            let mdns =
-                mdns::tokio::Behaviour::new(mdns::Config::default(), key.public().to_peer_id())?;
-            Ok(MyBehaviour { gossipsub, mdns })
-        })?
-        .build();
-
-    println!("Running swarm with identity {}", swarm.local_peer_id());
-
-    // Create a Gossipsub topic
-    let topic = gossipsub::IdentTopic::new("test-net");
-    // subscribes to our topic
-    swarm.behaviour_mut().gossipsub.subscribe(&topic)?;
-
-    // Read full lines from stdin
-    let mut stdin = io::BufReader::new(io::stdin()).lines();
-
-    // Listen on all interfaces and whatever port the OS assigns
-    swarm.listen_on("/ip4/0.0.0.0/tcp/0".parse()?)?;
-
-    println!("Enter messages via STDIN and they will be sent to connected peers using Gossipsub");
-
-    // Kick it off
-    loop {
-        select! {
-            Ok(Some(line)) = stdin.next_line() => {
-                if let Err(e) = swarm
-                    .behaviour_mut().gossipsub
-                    .publish(topic.clone(), line.as_bytes()) {
-                    println!("Publish error: {e:?}");
-                }
-            }
-            event = swarm.select_next_some() => match event {
-                SwarmEvent::Behaviour(MyBehaviourEvent::Mdns(mdns::Event::Discovered(list))) => {
-                    for (peer_id, multiaddr) in list {
-                        println!("mDNS discovered a new peer: {peer_id} on {multiaddr}");
-                        swarm.behaviour_mut().gossipsub.add_explicit_peer(&peer_id);
-                    }
-                },
-                SwarmEvent::Behaviour(MyBehaviourEvent::Mdns(mdns::Event::Expired(list))) => {
-                    for (peer_id, multiaddr) in list {
-                        println!("mDNS discover peer has expired: {peer_id} on {multiaddr}");
-                        swarm.behaviour_mut().gossipsub.remove_explicit_peer(&peer_id);
-                    }
-                },
-                SwarmEvent::Behaviour(MyBehaviourEvent::Gossipsub(gossipsub::Event::Message {
-                    propagation_source: peer_id,
-                    message_id: id,
-                    message,
-                })) => println!(
-                    "Got message: '{}' with id: {id} from peer: {peer_id}",
-                    String::from_utf8_lossy(&message.data),
-                ),
-                SwarmEvent::NewListenAddr { address, .. } => {
-                    println!("Local node is listening on {address}");
-                }
-                e => {
-                    println!("Other swarm event: {:?}", e);
-                }
-            }
-        }
-    }
-}
@@ -1,7 +1,7 @@
 use crate::ext::MultiaddrExt;
 use delegate::delegate;
 use either::Either;
-use futures::FutureExt;
+use futures_lite::FutureExt;
 use futures_timer::Delay;
 use libp2p::core::transport::PortUse;
 use libp2p::core::{ConnectedPoint, Endpoint};
@@ -362,7 +362,7 @@ impl NetworkBehaviour for Behaviour {
        }

        // retry connecting to all mDNS peers periodically (fails safely if already connected)
-        if self.retry_delay.poll_unpin(cx).is_ready() {
+        if self.retry_delay.poll(cx).is_ready() {
            for (p, mas) in self.mdns_discovered.clone() {
                for ma in mas {
                    self.dial(p, ma)
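
`poll_unpin` comes from futures' `FutureExt`; futures-lite's `FutureExt` instead exposes `poll(&mut self, cx)` for `Unpin` futures, which `futures_timer::Delay` is, so the call above is a drop-in swap. A minimal sketch, assuming only the two dependencies already in play:

```rust
use std::task::Context;

use futures_lite::FutureExt; // provides poll(&mut self, cx) where Self: Unpin
use futures_timer::Delay;

// Equivalent of the diff's `self.retry_delay.poll(cx).is_ready()` check.
fn timer_fired(delay: &mut Delay, cx: &mut Context<'_>) -> bool {
    delay.poll(cx).is_ready()
}

fn main() {}
```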

@@ -31,7 +31,7 @@ pub fn create_swarm(keypair: identity::Keypair) -> alias::AnyResult<Swarm> {
 mod transport {
     use crate::alias;
     use crate::swarm::{NETWORK_VERSION, OVERRIDE_VERSION_ENV_VAR};
-    use futures::{AsyncRead, AsyncWrite};
+    use futures_lite::{AsyncRead, AsyncWrite};
     use keccak_const::Sha3_256;
     use libp2p::core::muxing;
     use libp2p::core::transport::Boxed;

@@ -1,11 +1,10 @@
 { inputs, ... }:
 {
   perSystem =
-    { config, self', inputs', pkgs, lib, ... }:
+    { inputs', pkgs, lib, ... }:
     let
       # Fenix nightly toolchain with all components
-      fenixPkgs = inputs'.fenix.packages;
-      rustToolchain = fenixPkgs.complete.withComponents [
+      rustToolchain = inputs'.fenix.packages.stable.withComponents [
         "cargo"
         "rustc"
         "clippy"

@@ -1,2 +0,0 @@
-[toolchain]
-channel = "nightly"
@@ -31,6 +31,7 @@ from exo.shared.types.openai_responses import (
     ResponseOutputText,
     ResponsesRequest,
     ResponsesResponse,
+    ResponsesStreamEvent,
     ResponseTextDeltaEvent,
     ResponseTextDoneEvent,
     ResponseUsage,
@@ -38,6 +39,11 @@ from exo.shared.types.openai_responses import (
 from exo.shared.types.text_generation import InputMessage, TextGenerationTaskParams


+def _format_sse(event: ResponsesStreamEvent) -> str:
+    """Format a streaming event as an SSE message."""
+    return f"event: {event.type}\ndata: {event.model_dump_json()}\n\n"
+
+
 def _extract_content(content: str | list[ResponseContentPart]) -> str:
     """Extract plain text from a content field that may be a string or list of parts."""
     if isinstance(content, str):
@@ -219,13 +225,13 @@ async def generate_responses_stream(
     created_event = ResponseCreatedEvent(
         sequence_number=next(seq), response=initial_response
     )
-    yield f"event: response.created\ndata: {created_event.model_dump_json()}\n\n"
+    yield _format_sse(created_event)

     # response.in_progress
     in_progress_event = ResponseInProgressEvent(
         sequence_number=next(seq), response=initial_response
     )
-    yield f"event: response.in_progress\ndata: {in_progress_event.model_dump_json()}\n\n"
+    yield _format_sse(in_progress_event)

     # response.output_item.added
     initial_item = ResponseMessageItem(
@@ -236,7 +242,7 @@ async def generate_responses_stream(
     item_added = ResponseOutputItemAddedEvent(
         sequence_number=next(seq), output_index=0, item=initial_item
     )
-    yield f"event: response.output_item.added\ndata: {item_added.model_dump_json()}\n\n"
+    yield _format_sse(item_added)

     # response.content_part.added
     initial_part = ResponseOutputText(text="")
@@ -247,7 +253,7 @@ async def generate_responses_stream(
         content_index=0,
         part=initial_part,
     )
-    yield f"event: response.content_part.added\ndata: {part_added.model_dump_json()}\n\n"
+    yield _format_sse(part_added)

     accumulated_text = ""
     function_call_items: list[ResponseFunctionCallItem] = []
@@ -281,7 +287,7 @@ async def generate_responses_stream(
                 output_index=next_output_index,
                 item=fc_item,
             )
-            yield f"event: response.output_item.added\ndata: {fc_added.model_dump_json()}\n\n"
+            yield _format_sse(fc_added)

             # response.function_call_arguments.delta
             args_delta = ResponseFunctionCallArgumentsDeltaEvent(
@@ -290,7 +296,7 @@ async def generate_responses_stream(
                 output_index=next_output_index,
                 delta=tool.arguments,
             )
-            yield f"event: response.function_call_arguments.delta\ndata: {args_delta.model_dump_json()}\n\n"
+            yield _format_sse(args_delta)

             # response.function_call_arguments.done
             args_done = ResponseFunctionCallArgumentsDoneEvent(
@@ -300,7 +306,7 @@ async def generate_responses_stream(
                 name=tool.name,
                 arguments=tool.arguments,
             )
-            yield f"event: response.function_call_arguments.done\ndata: {args_done.model_dump_json()}\n\n"
+            yield _format_sse(args_done)

             # response.output_item.done
             fc_done_item = ResponseFunctionCallItem(
@@ -315,7 +321,7 @@ async def generate_responses_stream(
                 output_index=next_output_index,
                 item=fc_done_item,
             )
-            yield f"event: response.output_item.done\ndata: {fc_item_done.model_dump_json()}\n\n"
+            yield _format_sse(fc_item_done)

             function_call_items.append(fc_done_item)
             next_output_index += 1
@@ -331,7 +337,7 @@ async def generate_responses_stream(
                 content_index=0,
                 delta=chunk.text,
             )
-            yield f"event: response.output_text.delta\ndata: {delta_event.model_dump_json()}\n\n"
+            yield _format_sse(delta_event)

     # response.output_text.done
     text_done = ResponseTextDoneEvent(
@@ -341,7 +347,7 @@ async def generate_responses_stream(
         content_index=0,
         text=accumulated_text,
     )
-    yield f"event: response.output_text.done\ndata: {text_done.model_dump_json()}\n\n"
+    yield _format_sse(text_done)

     # response.content_part.done
     final_part = ResponseOutputText(text=accumulated_text)
@@ -352,7 +358,7 @@ async def generate_responses_stream(
         content_index=0,
         part=final_part,
     )
-    yield f"event: response.content_part.done\ndata: {part_done.model_dump_json()}\n\n"
+    yield _format_sse(part_done)

     # response.output_item.done
     final_message_item = ResponseMessageItem(
@@ -363,7 +369,7 @@ async def generate_responses_stream(
     item_done = ResponseOutputItemDoneEvent(
         sequence_number=next(seq), output_index=0, item=final_message_item
     )
-    yield f"event: response.output_item.done\ndata: {item_done.model_dump_json()}\n\n"
+    yield _format_sse(item_done)

     # Create usage from usage data if available
     usage = None
@@ -388,4 +394,4 @@ async def generate_responses_stream(
     completed_event = ResponseCompletedEvent(
         sequence_number=next(seq), response=final_response
     )
-    yield f"event: response.completed\ndata: {completed_event.model_dump_json()}\n\n"
+    yield _format_sse(completed_event)
@@ -241,6 +241,11 @@ class Worker:
                     cancelled_task_id=cancelled_task_id, runner_id=runner_id
                 ):
                     await self.runners[runner_id].cancel_task(cancelled_task_id)
+                    await self.event_sender.send(
+                        TaskStatusUpdated(
+                            task_id=task.task_id, task_status=TaskStatus.Complete
+                        )
+                    )
                 case ImageEdits() if task.task_params.total_input_chunks > 0:
                     # Assemble image from chunks and inject into task
                     cmd_id = task.command_id