---
# Two independent option lists, one top-level key each.
# NOTE(review): this looks like a parameter matrix (GPU model x task variant)
# read by an external tool — confirm the expected schema with the consumer.

# GPU model identifiers; quoted so they are always read as strings.
gpu: ["A40", "A100"]

# Task variant names; each "-concise" entry pairs with a base name.
task: ["chat", "chat-concise", "instruct", "instruct-concise"]