# Runtime environment settings, one KEY=value pair per line.
# NOTE(review): the consumer of this file is not visible from here (env-file
# loader, dotenv library, shell `source`, ...). Keep comments on their own
# lines; many loaders treat trailing text after a value as part of the value.

# Presumably the TCP port the API server listens on; verify against the service.
API_PORT=8080
# Presumably a 1/0 toggle for model compilation (e.g. torch.compile).
# TODO confirm how the application parses this flag.
COMPILE=1
# Presumably a 1/0 toggle for half-precision (fp16) inference.
# TODO confirm how the application parses this flag.
HALF=1
# PyTorch CUDA caching-allocator options, as comma-separated option:value pairs.
#   max_split_size_mb:64       - per the PyTorch docs, the allocator will not
#                                split cached blocks larger than this size (MB).
#   expandable_segments:True   - enables expandable segments, which the PyTorch
#                                docs mark as experimental.
# PyTorch reads this variable from the process environment, so it must be
# exported before the application initializes CUDA.
PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:64,expandable_segments:True