neural-os

Runtime error

da03 committed on Jul 13

Commit

64a144d

1 Parent(s): 888f299

.

Files changed (4) hide show

dispatcher.py CHANGED Viewed

@@ -1210,7 +1210,7 @@ if __name__ == "__main__":
     import argparse
     parser = argparse.ArgumentParser(description="Dispatcher for Neural OS")
-    parser.add_argument("--port", type=int, default=8000, help="Port to run the dispatcher on")
     args = parser.parse_args()
     logger.info(f"🌐 Starting dispatcher on 0.0.0.0:{args.port}")

     import argparse
     parser = argparse.ArgumentParser(description="Dispatcher for Neural OS")
+    parser.add_argument("--port", type=int, default=7860, help="Port to run the dispatcher on")
     args = parser.parse_args()
     logger.info(f"🌐 Starting dispatcher on 0.0.0.0:{args.port}")

start_system.sh CHANGED Viewed

@@ -148,7 +148,7 @@ echo "✅ Dispatcher started (PID: $DISPATCHER_PID)"
 # Start workers
 echo "🔧 Starting $NUM_GPUS GPU workers..."
-python start_workers.py --num-gpus $NUM_GPUS --no-monitor > workers.log 2>&1
 WORKER_START_EXIT_CODE=$?
 # Wait for workers to fully load models and register (60 seconds)

 # Start workers
 echo "🔧 Starting $NUM_GPUS GPU workers..."
+python start_workers.py --num-gpus $NUM_GPUS --dispatcher-url "http://localhost:$DISPATCHER_PORT" --no-monitor > workers.log 2>&1
 WORKER_START_EXIT_CODE=$?
 # Wait for workers to fully load models and register (60 seconds)

start_workers.py CHANGED Viewed

@@ -13,7 +13,7 @@ import os
 from typing import List
 class WorkerManager:
-    def __init__(self, num_gpus: int, dispatcher_url: str = "http://localhost:8000"):
         self.num_gpus = num_gpus
         self.dispatcher_url = dispatcher_url
         self.processes: List[subprocess.Popen] = []
@@ -143,7 +143,7 @@ def main():
     parser = argparse.ArgumentParser(description="Start multiple GPU workers")
     parser.add_argument("--num-gpus", type=int, required=True,
                        help="Number of GPU workers to start")
-    parser.add_argument("--dispatcher-url", type=str, default="http://localhost:8000",
                        help="URL of the dispatcher service")
     parser.add_argument("--no-monitor", action="store_true",
                        help="Start workers but don't monitor them")

 from typing import List
 class WorkerManager:
+    def __init__(self, num_gpus: int, dispatcher_url: str = "http://localhost:7860"):
         self.num_gpus = num_gpus
         self.dispatcher_url = dispatcher_url
         self.processes: List[subprocess.Popen] = []
     parser = argparse.ArgumentParser(description="Start multiple GPU workers")
     parser.add_argument("--num-gpus", type=int, required=True,
                        help="Number of GPU workers to start")
+    parser.add_argument("--dispatcher-url", type=str, default="http://localhost:7860",
                        help="URL of the dispatcher service")
     parser.add_argument("--no-monitor", action="store_true",
                        help="Start workers but don't monitor them")

worker.py CHANGED Viewed

@@ -27,7 +27,7 @@ torch.backends.cuda.matmul.allow_tf32 = True
 torch.backends.cudnn.allow_tf32 = True
 class GPUWorker:
-    def __init__(self, worker_address: str, dispatcher_url: str = "http://localhost:8000"):
         self.worker_address = worker_address  # e.g., "localhost:8001", "192.168.1.100:8002"
         # Parse port from worker address
         if ':' in worker_address:
@@ -771,7 +771,7 @@ if __name__ == "__main__":
     # Parse command line arguments
     parser = argparse.ArgumentParser(description="GPU Worker for Neural OS")
     parser.add_argument("--worker-address", type=str, required=True, help="Worker address (e.g., 'localhost:8001', '192.168.1.100:8002')")
-    parser.add_argument("--dispatcher-url", type=str, default="http://localhost:8000", help="Dispatcher URL")
     args = parser.parse_args()
     # Parse port from worker address for validation

 torch.backends.cudnn.allow_tf32 = True
 class GPUWorker:
+    def __init__(self, worker_address: str, dispatcher_url: str = "http://localhost:7860"):
         self.worker_address = worker_address  # e.g., "localhost:8001", "192.168.1.100:8002"
         # Parse port from worker address
         if ':' in worker_address:
     # Parse command line arguments
     parser = argparse.ArgumentParser(description="GPU Worker for Neural OS")
     parser.add_argument("--worker-address", type=str, required=True, help="Worker address (e.g., 'localhost:8001', '192.168.1.100:8002')")
+    parser.add_argument("--dispatcher-url", type=str, default="http://localhost:7860", help="Dispatcher URL")
     args = parser.parse_args()
     # Parse port from worker address for validation