[WIP] PTQ for generate_v2
#1866
Dr.CI classification results
{"FAILED":[{"workflowId":11411027807,"workflowUniqueId":103397641,"id":31754517178,"runnerName":"i-031be088ab34a3862","authorEmail":"jrcummings27@gmail.com","name":"GPU tests / gpu_test (3.9, stable)","jobName":"gpu_test (3.9, stable)","conclusion":"cancelled","completed_at":"2024-10-18T22:17:55.000000000Z","html_url":"https://github.com/pytorch/torchtune/actions/runs/11411027807/job/31754517178","head_branch":"add-quantize-generate-v2","pr_number":1866,"head_sha":"eafd3b294c305f81c0aaba374ac27de4d59e26a3","head_sha_timestamp":"2024-10-18T21:06:48Z","failure_captures":[],"failure_lines":[],"failure_context":[],"time":"2024-10-18T21:07:01.000000000Z"},{"workflowId":11411027807,"workflowUniqueId":103397641,"id":31754517476,"runnerName":"i-047a4d9399c363f36","authorEmail":"jrcummings27@gmail.com","name":"GPU tests / gpu_test (3.10, stable)","jobName":"gpu_test (3.10, stable)","conclusion":"failure","completed_at":"2024-10-18T22:17:30.000000000Z","html_url":"https://github.com/pytorch/torchtune/actions/runs/11411027807/job/31754517476","head_branch":"add-quantize-generate-v2","pr_number":1866,"head_sha":"eafd3b294c305f81c0aaba374ac27de4d59e26a3","head_sha_timestamp":"2024-10-18T21:06:48Z","failure_captures":["tests/recipes/dev/test_generate_v2.py::TestGenerateV2::test_llama2_generate_with_quantization"],"failure_lines":["FAILED tests/recipes/dev/test_generate_v2.py::TestGenerateV2::test_llama2_generate_with_quantization - RuntimeError: CUDA error: named symbol not found"],"failure_context":[],"time":"2024-10-18T21:07:01.000000000Z"},{"workflowId":11411027807,"workflowUniqueId":103397641,"id":31754517726,"runnerName":"i-0fc40590676f3eb06","authorEmail":"jrcummings27@gmail.com","name":"GPU tests / gpu_test (3.11, stable)","jobName":"gpu_test (3.11, stable)","conclusion":"cancelled","completed_at":"2024-10-18T22:17:57.000000000Z","html_url":"https://github.com/pytorch/torchtune/actions/runs/11411027807/job/31754517726","head_branch":"add-quantize-generate-v2","pr_number":1866,"head_sha":"eafd3b294c305f81c0aaba374ac27de4d59e26a3","head_sha_timestamp":"2024-10-18T21:06:48Z","failure_captures":["##[error]The operation was canceled."],"failure_lines":["##[error]The operation was canceled."],"failure_context":[],"time":"2024-10-18T21:07:02.000000000Z"}],"FLAKY":[],"BROKEN_TRUNK":[],"UNSTABLE":[]}