# This file holds our sample data (query and documents/corpus).
# We define it here to keep our main script clean.

# The one natural-language question we want the sample corpus to answer.
QUERY: str = "Which planet is known as the Red Planet?"

# Knowledge corpus: plain document strings, one entry per planet.
# These get converted to embeddings and compared against the query.
# Long sentences are wrapped using adjacent-string-literal concatenation;
# each parenthesized group is a single list element.
DOCUMENTS = [
    (
        "Venus is the second planet from the Sun and is often called "
        "Earth's twin because of its similar size and proximity."
    ),
    (
        "Mars is the fourth planet from the Sun and is frequently referred "
        "to as the Red Planet due to its reddish appearance caused by iron "
        "oxide on its surface."
    ),
    (
        "Jupiter is the fifth and largest planet in our solar system, "
        "a gas giant known for its prominent Great Red Spot, a giant storm."
    ),
    (
        "Saturn is the sixth planet from the Sun, famous for its extensive "
        "and visible ring system made of ice particles and dust."
    ),
]

# Optional, richer variant of the corpus: each document is a dict carrying
# a "title" alongside its "text". Handy when metadata such as titles is
# available, since titles work well with EmbeddingGemma's prompts.
# NOTE(review): the Jupiter and Saturn texts mention "red spot" / "Red Planet";
# presumably these are intentional distractors for the query - confirm.
DOCUMENTS_WITH_META = [
    {"title": title, "text": text}
    for title, text in (
        (
            "Venus",
            "Venus is often called Earth's twin because of its similar size and proximity.",
        ),
        (
            "Mars",
            "Mars, known for its reddish appearance, is often referred to as the Red Planet.",
        ),
        (
            "Jupiter",
            "Jupiter, the largest planet in our solar system, has a prominent red spot.",
        ),
        (
            "Saturn",
            "Saturn, famous for its rings, is sometimes mistaken for the Red Planet.",
        ),
    )
]