# Sample data for the example: one query plus a small document corpus.
# It is defined in its own file to keep the main script clean.

# The single query string we want to find an answer for.
QUERY = "Which planet is known as the Red Planet?"

# Knowledge corpus as a list of plain document strings.
# These are converted to embeddings and compared against the query.
DOCUMENTS = [
    "Venus is the second planet from the Sun and is often called Earth's twin because of its similar size and proximity.",
    "Mars is the fourth planet from the Sun and is frequently referred to as the Red Planet due to its reddish appearance caused by iron oxide on its surface.",
    "Jupiter is the fifth and largest planet in our solar system, a gas giant known for its prominent Great Red Spot, a giant storm.",
    "Saturn is the sixth planet from the Sun, famous for its extensive and visible ring system made of ice particles and dust.",
]

# Optional: a richer variant of the corpus as a list of dictionaries, each
# with a "title" and a "text" key. Useful when documents carry metadata such
# as titles, which work well with EmbeddingGemma's prompts.
# NOTE(review): the Jupiter and Saturn texts mention "red"/"Red Planet" even
# though Mars is the expected match -- presumably deliberate distractors for
# the retrieval demo; confirm before "correcting" them.
DOCUMENTS_WITH_META = [
    {
        "title": "Venus",
        "text": "Venus is often called Earth's twin because of its similar size and proximity.",
    },
    {
        "title": "Mars",
        "text": "Mars, known for its reddish appearance, is often referred to as the Red Planet.",
    },
    {
        "title": "Jupiter",
        "text": "Jupiter, the largest planet in our solar system, has a prominent red spot.",
    },
    {
        "title": "Saturn",
        "text": "Saturn, famous for its rings, is sometimes mistaken for the Red Planet.",
    },
]