{ lib
, buildPythonPackage
, fetchPypi
, setuptools
, attrs
, numpy
, pulp
, torch
, tqdm
, transformers
}:

buildPythonPackage rec {
  pname = "flexgen";
  version = "0.1.7";
  format = "pyproject";

  src = fetchPypi {
    inherit pname version;
    hash = "sha256-GYnl5CYsMWgTdbCfhWcNyjtpnHCXAcYWtMUmAJcRQAM=";
  };

  nativeBuildInputs = [
    setuptools
  ];

  propagatedBuildInputs = [
    attrs
    numpy
    pulp
    torch
    tqdm
    transformers
  ];

  pythonImportsCheck = [ "flexgen" ];

  meta = with lib; {
    description = "Running large language models like OPT-175B/GPT-3 on a single GPU. Focusing on high-throughput large-batch generation";
    homepage = "https://github.com/FMInference/FlexGen";
    license = licenses.asl20;
    maintainers = with maintainers; [ jpetrucciani ];
  };
}