
@Basten7
Basten7 / ggml-metal-optimized-4.m
Created August 11, 2025 08:24
Evolution of a new Metal 3 backend for llama.cpp
#import "ggml-metal.h"
#import "ggml-impl.h"
#import "ggml-backend-impl.h"
#import "ggml-metal-impl.h"
#import <Foundation/Foundation.h>
#import <Metal/Metal.h>

import argparse
import math
import mlx.core as mx
import mlx.nn as nn
from tqdm import tqdm
from mlx_lm.utils import load
from pathlib import Path
def eval_ppl(model, data, batch_size=32):
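The preview above cuts off at the `eval_ppl` signature. For context, perplexity is the exponential of the mean per-token negative log-likelihood over the evaluation set. A minimal pure-Python sketch of that arithmetic (the helper name `perplexity` and the uniform-model example are illustrative, not taken from the gist):

```python
import math

def perplexity(token_nlls):
    # Perplexity is exp of the average per-token
    # negative log-likelihood over the evaluation set.
    return math.exp(sum(token_nlls) / len(token_nlls))

# Illustrative example: a uniform model over a 4-symbol vocabulary
# assigns every token an NLL of log(4), so perplexity comes out
# at (approximately) 4.
nlls = [math.log(4)] * 10
print(perplexity(nlls))
```

In the gist's setting, the per-token NLLs would come from cross-entropy losses computed with `mlx` over batches of `data`, accumulated before the final exponential.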
@awni
awni / mlx_distributed_deepseek.md
Last active January 9, 2026 05:35
Run DeepSeek R1 or V3 with MLX Distributed

Setup

On every machine in the cluster, install openmpi and mlx-lm:

conda install conda-forge::openmpi
pip install -U mlx-lm

Next, download the pipeline-parallel run script to the same path on every machine: