Add the layer norm files. (#222)

This commit is contained in:
Laurent Mazare
2023-07-22 16:06:35 +02:00
committed by GitHub
parent 1f26042693
commit c8459d199d
9 changed files with 1532 additions and 0 deletions

View File

@@ -184,6 +184,7 @@ mod cuda {
let mut command = std::process::Command::new("nvcc");
command.arg(format!("--gpu-architecture=sm_{compute_cap}"))
.arg("--ptx")
.arg("--expt-relaxed-constexpr")
.args(["--default-stream", "per-thread"])
.args(["--output-directory", &out_dir])
// Flash attention only