-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path.env.example
More file actions
34 lines (28 loc) · 969 Bytes
/
.env.example
File metadata and controls
34 lines (28 loc) · 969 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# StreamAttention environment configuration example
# Copy to .env and edit as needed

# Build configuration
# The value is quoted so the ';' stays part of the value when this file is
# sourced by a POSIX shell; unquoted, the shell treats ';' as a command
# separator, assigns only "80", and then tries to run "90" as a command.
# NOTE(review): PyTorch's extension builder documents dotted compute
# capabilities (e.g. "8.0;9.0") for this variable -- confirm that the build
# script consuming this file accepts the undotted form.
TORCH_CUDA_ARCH_LIST="80;90"
CUDA_HOME=/usr/local/cuda
# Cache directories are derived from ${HOME}; the loader must support
# ${VAR} expansion for these to resolve.
CUDA_CACHE_PATH=${HOME}/.cache/stream_attn/cuda
TRITON_CACHE_DIR=${HOME}/.cache/stream_attn/triton

# Core StreamAttention settings
STREAM_ATTENTION_NUM_HEADS=32
STREAM_ATTENTION_HEAD_DIM=128
STREAM_ATTENTION_TILE_Q=128
STREAM_ATTENTION_TILE_K=64
STREAM_ATTENTION_MAX_SEQ_LEN=65536

# Optional features
STREAM_ATTENTION_ENABLE_KV_COMPRESSION=true
STREAM_ATTENTION_KV_COMPRESSION_RATIO=4.0

# Ring Attention
STREAM_ATTENTION_RING_BLOCK_SIZE=2048
STREAM_ATTENTION_RING_OVERLAP_SIZE=256

# Star Attention
STREAM_ATTENTION_STAR_BLOCK_SIZE=2048
STREAM_ATTENTION_STAR_ANCHOR_SIZE=256
STREAM_ATTENTION_STAR_NUM_HOSTS=1