chore: formatting powerinfer Python code

SJTU-IPADS · Apr 8, 2024 · 5b4c22b · 5b4c22b
1 parent 3d90d1f
commit 5b4c22b
Show file tree

Hide file tree

Showing 3 changed files with 3 additions and 9 deletions.
diff --git a/powerinfer-py/powerinfer/__main__.py b/powerinfer-py/powerinfer/__main__.py
@@ -1,4 +1,3 @@
-
 import argparse
 
 from .solver import solve_gpu_split
@@ -10,8 +9,8 @@
     # Set up command line arguments
     parser = argparse.ArgumentParser(description='Optimize neuron activation based on VRAM capacity and other parameters.')
     parser.add_argument('--activation', type=str, required=True, help='Path to the directory containing activation data.')
-    parser.add_argument('--neuron', type=int, default=8192*4, help='Total number of neurons in the network.')
-    parser.add_argument('--capacity', type=int, default=int(8192*4*32*0.1), help='Total VRAM capacity for the model.')
+    parser.add_argument('--neuron', type=int, default=8192*4, help='Total number of neurons in each layer.')
+    parser.add_argument('--capacity', type=int, help='Max neurons that can be stored in VRAM.')
     parser.add_argument('--layer', type=int, default=59, help='Total number of layers in the neural network.')
     parser.add_argument('--vram-capacity', type=int, help='Total VRAM capacity (Bytes) available for splitting')
     parser.add_argument('--batch', type=int, default=256, help='Batch size for processing.')

diff --git a/powerinfer-py/powerinfer/export_split.py b/powerinfer-py/powerinfer/export_split.py
@@ -1,5 +1,3 @@
-import argparse
-import pickle
 import gguf
 from gguf.constants import GGMLQuantizationType
 from gguf.gguf_writer import GGUFWriter
@@ -10,6 +8,7 @@
 import numpy as np
 import re
 
+
 def load_activation_weights(models_base: Path):
     # TODO: might need a specification file to indicate which models to load.
     # But for now, let's assume it is a plain directory of activation_{0, ... , n_layers - 1}.pt

diff --git a/powerinfer-py/powerinfer/solver.py b/powerinfer-py/powerinfer/solver.py
@@ -1,11 +1,7 @@
-#!/usr/bin/env python
-# coding=utf-8
-import argparse
 from cvxopt.glpk import ilp
 import numpy as np
 from cvxopt import matrix
 import torch
-import pickle
 
 def solve_gpu_split(
     activation_path: str,