[package]
name = "candle-flash-attn"
version = "0.2.2"
edition = "2021"
description = "Flash attention layer for the candle ML framework."
repository = "https://github.com/huggingface/candle"
keywords = ["blas", "tensor", "machine-learning"]
categories = ["science"]
license = "MIT OR Apache-2.0"
readme = "README.md"
[dependencies]
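# `candle` is the candle-core crate renamed via `package`; the `cuda` feature is
# required because the flash-attention kernels only have a CUDA implementation.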
candle = { path = "../candle-core", features = ["cuda"], version = "0.2.2", package = "candle-core" }
half = { version = "2.3.1", features = ["num-traits"] }
[build-dependencies]
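# Used by build.rs, which compiles the flash-attention CUDA kernels;
# rayon and num_cpus parallelize the kernel compilation.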
anyhow = { version = "1", features = ["backtrace"] }
num_cpus = "1.15.0"
rayon = "1.7.0"
[dev-dependencies]
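# Test-only dependencies (candle-nn is presumably used to build a reference
# attention implementation for checking the kernel outputs).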
anyhow = { version = "1", features = ["backtrace"] }
candle-nn = { path = "../candle-nn", version = "0.2.2", features = ["cuda"] }