Browse Source

add missing top_p_sampling import

Alex Cheema 7 months ago
parent
commit
6659a18e94
1 changed file with 1 addition and 0 deletions
  1. 1 0
      exo/inference/mlx/sharded_inference_engine.py

+ 1 - 0
exo/inference/mlx/sharded_inference_engine.py

@@ -1,6 +1,7 @@
 import numpy as np
 import mlx.core as mx
 import mlx.nn as nn
+from mlx_lm.sample_utils import top_p_sampling
 from ..inference_engine import InferenceEngine
 from .stateful_model import StatefulModel
 from .sharded_utils import load_shard