Spaces:
Running
Running
File size: 4,757 Bytes
083f13e 8bd40a9 083f13e 8bd40a9 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 |
from .custom_components import QuizParser
from haystack.components.converters import HTMLToDocument
from haystack.components.fetchers import LinkContentFetcher
from haystack.components.generators import OpenAIGenerator
from haystack.components.builders import PromptBuilder
from haystack.components.websearch.serper_dev import SerperDevWebSearch
from haystack.utils import Secret
from haystack import Pipeline
quiz_generation_template = """Given the following text, create 5 multiple choice quizzes in JSON format.
Each question should have 4 different options, and only one of them should be correct.
The options should be unambiguous.
Each option should begin with a letter followed by a period and a space (e.g., "a. option").
The question should also briefly mention the general topic of the text so that it can be understood in isolation.
Each question should not give hints to answer the other questions.
Include challenging questions, which require reasoning.
respond with JSON only, no markdown or descriptions.
example JSON format you should absolutely follow:
{"topic": "a sentence explaining the topic of the text",
"questions":
[
{
"question": "text of the question",
"options": ["a. 1st option", "b. 2nd option", "c. 3rd option", "d. 4th option"],
"right_option": "c" # letter of the right option ("a" for the first, "b" for the second, etc.)
}, ...
]
}
text:
{% for doc in documents %}{{ doc.content|truncate(4000) }}{% endfor %}
"""
quiz_generation_pipeline = Pipeline()
quiz_generation_pipeline.add_component("link_content_fetcher", LinkContentFetcher())
quiz_generation_pipeline.add_component("html_converter", HTMLToDocument())
quiz_generation_pipeline.add_component(
"prompt_builder", PromptBuilder(template=quiz_generation_template)
)
quiz_generation_pipeline.add_component(
"generator",
OpenAIGenerator(
api_key=Secret.from_env_var("GROQ_API_KEY"),
api_base_url="https://api.groq.com/openai/v1",
model="llama3-8b-8192",
generation_kwargs={"max_tokens": 1000, "temperature": 0.5, "top_p": 1},
),
)
quiz_generation_pipeline.add_component("quiz_parser", QuizParser())
quiz_generation_pipeline.connect("link_content_fetcher", "html_converter")
quiz_generation_pipeline.connect("html_converter", "prompt_builder")
quiz_generation_pipeline.connect("prompt_builder", "generator")
quiz_generation_pipeline.connect("generator", "quiz_parser")
closed_book_template = """Answer the following question, specifying one of the options.
The topic is: {{ topic }}.
In the answer, just specify the letter corresponding to the option.
If you don't know the answer, just provide your best guess and do not provide any reasoning.
For example, if you think the answer is the first option, just write "a".
If you think the answer is the second option, just write "b", and so on.
question: {{ question["question"] }}
options: {{ question["options"] }}
chosen option (a, b, c, or d):
"""
closed_book_answer_pipeline = Pipeline()
closed_book_answer_pipeline.add_component(
"prompt_builder", PromptBuilder(template=closed_book_template)
)
closed_book_answer_pipeline.add_component(
"generator",
OpenAIGenerator(
api_key=Secret.from_env_var("GROQ_API_KEY"),
api_base_url="https://api.groq.com/openai/v1",
model="llama3-8b-8192",
generation_kwargs={"max_tokens": 5, "temperature": 0, "top_p": 1},
),
)
closed_book_answer_pipeline.connect("prompt_builder", "generator")
web_rag_template = """Answer the question about "{{topic}}", using your knowledge and the snippets extracted from the web.
In the answer, just specify the letter corresponding to the option.
If you don't know the answer, just provide your best guess and do not provide any reasoning.
For example, if you think the answer is the first option, just write "a".
If you think the answer is the second option, just write "b", and so on.
question: {{ question["question"] }}
options: {{ question["options"] }}
Snippets:
{% for doc in documents %}
- snippet: "{{doc.content}}"
{% endfor %}
chosen option (a, b, c, or d):
"""
web_rag_pipeline = Pipeline()
web_rag_pipeline.add_component("websearch", SerperDevWebSearch(top_k=3))
web_rag_pipeline.add_component(
"prompt_builder", PromptBuilder(template=web_rag_template)
)
web_rag_pipeline.add_component(
"generator",
OpenAIGenerator(
api_key=Secret.from_env_var("GROQ_API_KEY"),
api_base_url="https://api.groq.com/openai/v1",
model="llama3-8b-8192",
generation_kwargs={"max_tokens": 5, "temperature": 0, "top_p": 1},
),
)
web_rag_pipeline.connect("websearch.documents", "prompt_builder.documents")
web_rag_pipeline.connect("prompt_builder", "generator")
|