|
19 | 19 | action="store_true", |
20 | 20 | help="default not to keep the container", |
21 | 21 | ) |
| 22 | +group_container.add_argument( |
| 23 | + "--shm-size", |
| 24 | + type=str, |
| 25 | + required=False, |
| 26 | + help="default to half of the RAM size", |
| 27 | +) |
22 | 28 |
|
23 | 29 | group_server = args.add_argument_group("server") |
24 | | -group_server.add_argument("-m", "--model", type=str, required=True) |
| 30 | +group_server.add_argument( |
| 31 | + "-m", "--model", type=str, required=True, help="path to model dir" |
| 32 | +) |
25 | 33 | group_server.add_argument("-p", "--port", type=int, default=8080) |
26 | | -group_server.add_argument("-n", "--num-nodes", type=int, default=1) |
| 34 | +group_server.add_argument( |
| 35 | + "-n", "--num-proc", type=int, default=1, help="number of process/gpus" |
| 36 | +) |
27 | 37 | group_server.add_argument("-mt", "--max-total-tokens", type=int, default=4096) |
28 | 38 | args = args.parse_args() |
29 | 39 |
|
30 | 40 | model_path = os.path.abspath(args.model) |
| 41 | +shm_size = ( |
| 42 | + args.shm_size |
| 43 | + if args.shm_size |
| 44 | + else (os.sysconf("SC_PAGE_SIZE") * os.sysconf("SC_PHYS_PAGES") // 2) |
| 45 | +) |
31 | 46 |
|
32 | | -print(args) |
33 | 47 | launch_args = [ |
34 | 48 | "docker", |
35 | 49 | "run", |
|
40 | 54 | f"{args.port}:{args.port}", |
41 | 55 | "-v", |
42 | 56 | f"{model_path}:{model_path}", |
| 57 | + "--shm-size", |
| 58 | + str(shm_size), |
43 | 59 | ] |
44 | 60 | if args.name: |
45 | 61 | launch_args.extend(["--name", args.name]) |
|
61 | 77 | "--port", |
62 | 78 | args.port, |
63 | 79 | "--tp", |
64 | | - args.num_nodes, |
| 80 | + args.num_proc, |
65 | 81 | ] |
66 | 82 | ) |
| 83 | + |
67 | 84 | launch_args = list(map(str, launch_args)) |
68 | 85 | print(f'launching: {" ".join(launch_args)}') |
69 | 86 | os.execvp(launch_args[0], launch_args) |
0 commit comments