|
17 | 17 | from ramalama.kube import Kube |
18 | 18 | from ramalama.model_inspect import GGUFModelInfo, ModelInfoBase |
19 | 19 | from ramalama.quadlet import Quadlet |
| 20 | +from ramalama.kserve import Kserve |
20 | 21 | from ramalama.version import version |
21 | 22 |
|
22 | 23 | MODEL_TYPES = ["file", "https", "http", "oci", "huggingface", "hf", "ollama"] |
@@ -360,7 +361,6 @@ def get_model_path(self, args): |
360 | 361 |
|
361 | 362 | if args.dryrun: |
362 | 363 | return "/path/to/model" |
363 | | - |
364 | 364 | model_path = self.pull(args) |
365 | 365 |
|
366 | 366 | return model_path |
@@ -486,16 +486,15 @@ def handle_runtime(self, args, exec_args, exec_model_path): |
486 | 486 |
|
def generate_container_config(self, model_path, args, exec_args):
    """Dispatch to the generator selected by ``args.generate``.

    ``self.image`` is refreshed from ``self._image(args)`` before any
    generator runs.

    Returns:
        The selected generator method's return value when
        ``args.generate`` is one of "kserve", "quadlet", "kube" or
        "quadlet/kube"; ``False`` for any other value.
    """
    self.image = self._image(args)

    # (args.generate value, name of the method on self that handles it).
    # Compared with == in this order; the method is only looked up once a
    # value matches, so unrelated generators are never touched.
    generators = (
        ("kserve", "kserve"),
        ("quadlet", "quadlet"),
        ("kube", "kube"),
        ("quadlet/kube", "quadlet_kube"),
    )
    for requested, method_name in generators:
        if args.generate == requested:
            handler = getattr(self, method_name)
            return handler(model_path, args, exec_args)

    return False
499 | 498 |
|
500 | 499 | def execute_command(self, model_path, exec_args, args): |
501 | 500 | try: |
@@ -526,19 +525,27 @@ def serve(self, args): |
526 | 525 |
|
527 | 526 | self.execute_command(model_path, exec_args, args) |
528 | 527 |
|
def kserve(self, model, args, exec_args):
    """Run the Kserve generator for ``model`` and report success.

    Builds a ``Kserve`` object from the model, ``self.image``, ``args`` and
    ``exec_args``, calls its ``generate()`` method, and returns ``True``.
    """
    Kserve(model, self.image, args, exec_args).generate()
    return True
| 532 | + |
def quadlet(self, model, args, exec_args):
    """Run the Quadlet generator for ``model`` and report success.

    Builds a ``Quadlet`` object from the model, ``self.image``, ``args`` and
    ``exec_args``, calls its ``generate()`` method, and returns ``True``.
    """
    Quadlet(model, self.image, args, exec_args).generate()
    return True
532 | 537 |
|
def quadlet_kube(self, model, args, exec_args):
    """Run the Kube generator, then the Quadlet ``kube()`` step.

    Both helper objects are built from the same model, ``self.image``,
    ``args`` and ``exec_args``. ``Kube.generate()`` is called before the
    ``Quadlet`` object is constructed and its ``kube()`` method is called.
    Always returns ``True``.
    """
    kube_generator = Kube(model, self.image, args, exec_args)
    kube_generator.generate()

    quadlet_generator = Quadlet(model, self.image, args, exec_args)
    quadlet_generator.kube()

    return True
538 | 544 |
|
def kube(self, model, args, exec_args):
    """Run the Kube generator for ``model`` and report success.

    Builds a ``Kube`` object from the model, ``self.image``, ``args`` and
    ``exec_args``, calls its ``generate()`` method, and returns ``True``.
    """
    Kube(model, self.image, args, exec_args).generate()
    return True
542 | 549 |
|
def path(self, args):
    """Return whatever ``self.model_path(args)`` returns."""
    resolved = self.model_path(args)
    return resolved
|
0 commit comments