Searched refs:model_parallel_size (Results 1 – 2 of 2) sorted by relevance
271 model_parallel_size = 1
272 self.n_local_heads = self.n_heads // model_parallel_size
273 self.n_local_kv_heads = self.n_kv_heads // model_parallel_size
392 def init_model(self, device_type, model_parallel_size=2): [argument]
403 (world_size // model_parallel_size, model_parallel_size),