Find answers from the community

Updated last year

yas pllssss

At a glance
yas pllssss
D
1 comment
Here's my poverty version lol

# Build a preference (DPO-style) dataset as JSON lines.
#
# For every node, questions are generated with `gpt_4_context`. Each question
# is then answered twice against a DocumentSummaryIndex over that same node:
# the answer obtained with `gpt_40613_context` is stored under "chosen" and
# the answer obtained with `gpt35_context` under "rejected". One JSON line is
# written to `fp` per question.
#
# `nodes`, `question_gen_query`, the service contexts, `dpo_dataset_dict` and
# the open file handle `fp` are expected to be defined earlier in the script.
try:
    for idx, node in enumerate(nodes):
        dataset_generator = DatasetGenerator(
            [node],
            question_gen_query=question_gen_query,
            service_context=gpt_4_context,
            metadata_mode="all",
        )
        node_questions_0 = dataset_generator.generate_questions_from_nodes(num=5)
        print(f"[Node {idx}] Generated questions:\n {node_questions_0}")

        if not node_questions_0:
            # No questions for this node: skip building the indexes, as the
            # per-question construction in the original would never have run.
            continue

        # The indexes and query engines depend only on the node, not on the
        # question, so build them once per node instead of once per question.
        index = DocumentSummaryIndex([node], service_context=gpt_40613_context)
        index2 = DocumentSummaryIndex([node], service_context=gpt35_context)
        query_engine = index.as_query_engine()
        query_engine2 = index2.as_query_engine()

        # for each question, get a response from both engines
        for question in tqdm(node_questions_0):
            response = query_engine.query(question)
            dpo_dataset_dict["prompt"].append(question)
            dpo_dataset_dict["chosen"].append(str(response))

            response2 = query_engine2.query(question)
            dpo_dataset_dict["rejected"].append(str(response2))

            # Write the current entry to the file
            fp.write(json.dumps(dpo_dataset_dict) + "\n")
            # Clear the dictionary for the next entry
            dpo_dataset_dict = {
                "prompt": [],
                "chosen": [],
                "rejected": [],
            }
finally:
    # Close the output file even if generation or a query raises, so the
    # lines written so far are flushed and the handle is not leaked.
    fp.close()

This uses the GPT-3.5 response as the rejected answer and the gpt-4-0613 response as the chosen (accepted) one.
Add a reply
Sign up and join the conversation on Discord