wip(ci): debug the ci

This commit is contained in:
Baptiste Colle 2025-04-10 17:17:16 +02:00 committed by baptiste
parent d2b23a1ec5
commit 2821274a88

View File

@@ -5,26 +5,26 @@ import pytest
# The "args" values in TEST_CONFIGS are not optimized for speed; they only check that inference works for the different model architectures. # The "args" values in TEST_CONFIGS are not optimized for speed; they only check that inference works for the different model architectures.
TEST_CONFIGS = { TEST_CONFIGS = {
"meta-llama/Llama-3.1-8B-Instruct-shared": { # "meta-llama/Llama-3.1-8B-Instruct-shared": {
"model_id": "meta-llama/Llama-3.1-8B-Instruct", # "model_id": "meta-llama/Llama-3.1-8B-Instruct",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": " A Beginners Guide\nDeep learning is a subset of machine learning that involves the use of artificial neural networks to analyze and interpret data. It is a type of", # "expected_greedy_output": " A Beginners Guide\nDeep learning is a subset of machine learning that involves the use of artificial neural networks to analyze and interpret data. It is a type of",
"expected_batch_output": " A Beginners Guide\nDeep learning is a subset of machine learning that involves the use of artificial neural networks to analyze and interpret data. It is a type of", # "expected_batch_output": " A Beginners Guide\nDeep learning is a subset of machine learning that involves the use of artificial neural networks to analyze and interpret data. It is a type of",
"args": [ # "args": [
"--sharded", # "--sharded",
"true", # "true",
"--num-shard", # "--num-shard",
"8", # "8",
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"8", # "8",
"--max-batch-prefill-tokens", # "--max-batch-prefill-tokens",
"2048", # "2048",
], # ],
}, # },
"meta-llama/Llama-3.1-8B-Instruct": { "meta-llama/Llama-3.1-8B-Instruct": {
"model_id": "meta-llama/Llama-3.1-8B-Instruct", "model_id": "meta-llama/Llama-3.1-8B-Instruct",
"input": "What is Deep Learning?", "input": "What is Deep Learning?",
@@ -42,156 +42,156 @@ TEST_CONFIGS = {
"2048", "2048",
], ],
}, },
"meta-llama/Llama-2-7b-chat-hf": { # "meta-llama/Llama-2-7b-chat-hf": {
"model_id": "meta-llama/Llama-2-7b-chat-hf", # "model_id": "meta-llama/Llama-2-7b-chat-hf",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep learning (also known as deep structured learning) is part of a broader family of machine learning techniques based on artificial neural networks\u2014specific", # "expected_greedy_output": "\n\nDeep learning (also known as deep structured learning) is part of a broader family of machine learning techniques based on artificial neural networks\u2014specific",
"expected_batch_output": "\n\nDeep learning (also known as deep structured learning) is part of a broader family of machine learning techniques based on artificial neural networks\u2014specific", # "expected_batch_output": "\n\nDeep learning (also known as deep structured learning) is part of a broader family of machine learning techniques based on artificial neural networks\u2014specific",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
"--max-batch-prefill-tokens", # "--max-batch-prefill-tokens",
"2048", # "2048",
], # ],
}, # },
"mistralai/Mistral-7B-Instruct-v0.3": { # "mistralai/Mistral-7B-Instruct-v0.3": {
"model_id": "mistralai/Mistral-7B-Instruct-v0.3", # "model_id": "mistralai/Mistral-7B-Instruct-v0.3",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep learning is a subset of machine learning in artificial intelligence (AI) that has networks capable of learning unsupervised from data that is unstructured", # "expected_greedy_output": "\n\nDeep learning is a subset of machine learning in artificial intelligence (AI) that has networks capable of learning unsupervised from data that is unstructured",
"expected_batch_output": "\n\nDeep learning is a subset of machine learning in artificial intelligence (AI) that has networks capable of learning unsupervised from data that is unstructured", # "expected_batch_output": "\n\nDeep learning is a subset of machine learning in artificial intelligence (AI) that has networks capable of learning unsupervised from data that is unstructured",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
"--max-batch-prefill-tokens", # "--max-batch-prefill-tokens",
"2048", # "2048",
], # ],
}, # },
"bigcode/starcoder2-3b": { # "bigcode/starcoder2-3b": {
"model_id": "bigcode/starcoder2-3b", # "model_id": "bigcode/starcoder2-3b",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to perform tasks.\n\nNeural networks are a type of machine learning algorithm that", # "expected_greedy_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to perform tasks.\n\nNeural networks are a type of machine learning algorithm that",
"expected_batch_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to perform tasks.\n\nNeural networks are a type of machine learning algorithm that", # "expected_batch_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to perform tasks.\n\nNeural networks are a type of machine learning algorithm that",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
"--max-batch-prefill-tokens", # "--max-batch-prefill-tokens",
"2048", # "2048",
], # ],
}, # },
"google/gemma-7b-it": { # "google/gemma-7b-it": {
"model_id": "google/gemma-7b-it", # "model_id": "google/gemma-7b-it",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to learn from large amounts of data. Neural networks are inspired by the structure and function of", # "expected_greedy_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to learn from large amounts of data. Neural networks are inspired by the structure and function of",
"expected_batch_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to learn from large amounts of data. Neural networks are inspired by the structure and function of", # "expected_batch_output": "\n\nDeep learning is a subset of machine learning that uses artificial neural networks to learn from large amounts of data. Neural networks are inspired by the structure and function of",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
"--max-batch-prefill-tokens", # "--max-batch-prefill-tokens",
"2048", # "2048",
], # ],
}, # },
"Qwen/Qwen2-0.5B-Instruct": { # "Qwen/Qwen2-0.5B-Instruct": {
"model_id": "Qwen/Qwen2-0.5B-Instruct", # "model_id": "Qwen/Qwen2-0.5B-Instruct",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": " Deep Learning is a type of machine learning that is based on the principles of artificial neural networks. It is a type of machine learning that is used to train models", # "expected_greedy_output": " Deep Learning is a type of machine learning that is based on the principles of artificial neural networks. It is a type of machine learning that is used to train models",
"expected_batch_output": " Deep Learning is a type of machine learning that is based on the principles of artificial neural networks. It is a type of machine learning that is used to train models", # "expected_batch_output": " Deep Learning is a type of machine learning that is based on the principles of artificial neural networks. It is a type of machine learning that is used to train models",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
"--max-batch-prefill-tokens", # "--max-batch-prefill-tokens",
"2048", # "2048",
], # ],
}, # },
"tiiuae/falcon-7b-instruct": { # "tiiuae/falcon-7b-instruct": {
"model_id": "tiiuae/falcon-7b-instruct", # "model_id": "tiiuae/falcon-7b-instruct",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\nDeep learning is a branch of machine learning that uses artificial neural networks to learn and make decisions. It is based on the concept of hierarchical learning, where a", # "expected_greedy_output": "\nDeep learning is a branch of machine learning that uses artificial neural networks to learn and make decisions. It is based on the concept of hierarchical learning, where a",
"expected_batch_output": "\nDeep learning is a branch of machine learning that uses artificial neural networks to learn and make decisions. It is based on the concept of hierarchical learning, where a", # "expected_batch_output": "\nDeep learning is a branch of machine learning that uses artificial neural networks to learn and make decisions. It is based on the concept of hierarchical learning, where a",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
], # ],
}, # },
"microsoft/phi-1_5": { # "microsoft/phi-1_5": {
"model_id": "microsoft/phi-1_5", # "model_id": "microsoft/phi-1_5",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep Learning is a subfield of Machine Learning that focuses on building neural networks with multiple layers of interconnected nodes. These networks are designed to learn from large", # "expected_greedy_output": "\n\nDeep Learning is a subfield of Machine Learning that focuses on building neural networks with multiple layers of interconnected nodes. These networks are designed to learn from large",
"expected_batch_output": "\n\nDeep Learning is a subfield of Machine Learning that focuses on building neural networks with multiple layers of interconnected nodes. These networks are designed to learn from large", # "expected_batch_output": "\n\nDeep Learning is a subfield of Machine Learning that focuses on building neural networks with multiple layers of interconnected nodes. These networks are designed to learn from large",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
], # ],
}, # },
"openai-community/gpt2": { # "openai-community/gpt2": {
"model_id": "openai-community/gpt2", # "model_id": "openai-community/gpt2",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep learning is a new field of research that has been around for a long time. It is a new field of research that has been around for a", # "expected_greedy_output": "\n\nDeep learning is a new field of research that has been around for a long time. It is a new field of research that has been around for a",
"expected_batch_output": "\n\nDeep learning is a new field of research that has been around for a long time. It is a new field of research that has been around for a", # "expected_batch_output": "\n\nDeep learning is a new field of research that has been around for a long time. It is a new field of research that has been around for a",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
], # ],
}, # },
"facebook/opt-125m": { # "facebook/opt-125m": {
"model_id": "facebook/opt-125m", # "model_id": "facebook/opt-125m",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout", # "expected_greedy_output": "\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout",
"expected_batch_output": "\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout", # "expected_batch_output": "\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout the Author\n\nAbout",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
], # ],
}, # },
"EleutherAI/gpt-j-6b": { # "EleutherAI/gpt-j-6b": {
"model_id": "EleutherAI/gpt-j-6b", # "model_id": "EleutherAI/gpt-j-6b",
"input": "What is Deep Learning?", # "input": "What is Deep Learning?",
"expected_greedy_output": "\n\nDeep learning is a subset of machine learning that is based on the idea of neural networks. Neural networks are a type of artificial intelligence that is inspired by", # "expected_greedy_output": "\n\nDeep learning is a subset of machine learning that is based on the idea of neural networks. Neural networks are a type of artificial intelligence that is inspired by",
"expected_batch_output": "\n\nDeep learning is a subset of machine learning that is based on the idea of neural networks. Neural networks are a type of artificial intelligence that is inspired by", # "expected_batch_output": "\n\nDeep learning is a subset of machine learning that is based on the idea of neural networks. Neural networks are a type of artificial intelligence that is inspired by",
"args": [ # "args": [
"--max-input-tokens", # "--max-input-tokens",
"512", # "512",
"--max-total-tokens", # "--max-total-tokens",
"1024", # "1024",
"--max-batch-size", # "--max-batch-size",
"4", # "4",
], # ],
}, # },
} }
print(f"Testing {len(TEST_CONFIGS)} models") print(f"Testing {len(TEST_CONFIGS)} models")