lightudq.prompts
"""Prompt templates used for LLM-based document checks.

Every constant below is a plain string template. Names in single braces
(``{document}``, ``{output_schema}``, ...) are placeholders to be substituted
by the caller -- presumably via ``str.format``; confirm against the call sites.
"""

# NOTE(review): the indentation of nested list items inside the prompts is
# reproduced exactly as it appears in the rendered values (a single leading
# space). Confirm against the repository copy if deeper indentation was meant.

# Question/answer extraction.
# Placeholders: {num_questions}, {document}, {output_schema}.
QNA_EXTRACT_PROMPT = """You are an advanced text analysis system designed to extract key
information from documents in the form of question-answer pairs. Your task is to analyze the given document
and create up to {num_questions} question-answer pairs based on the information directly addressed in the text.

First, carefully read the following document:

<document>
{document}
</document>

Then extract key questions and their corresponding answers from the document. The answer in each question-answer pair
should be self-contained and fully comprehensible without needing to refer back to the question or the original document.

After completing your analysis, please format your output as a JSON object that adheres to the following
schema:

<output_schema>
{output_schema}
</output_schema>


Remember:
- The answer in each question-answer pair should be self-contained and fully comprehensible without needing to refer
 back to the question or the original document.
- Your final output must be strictly in the JSON format specified by the output_schema.
- Double-check your JSON structure before finalizing your response.
- Do not output any reasoning or justifications
"""


# Lists the questions that the document fails to answer.
# Placeholders: {document}, {questions}, {output_schema}.
MISSING_QUESTIONS_PROMPT = """Check if the following document answers the following questions.
<document>
{document}
</document>

<questions>
{questions}
</questions>

Output just the list of questions (if any) not answered by the document, with the following output schema.
<output_schema>
{output_schema}
</output_schema>
"""


# Reports facts that the document directly contradicts.
# Placeholders: {document}, {facts}, {output_schema}.
# The step list is numbered 1-2-3: an earlier revision carried a second,
# shorter copy of step 2 (without the "different procedure" rule), which gave
# the model two competing versions of the same instruction.
FACT_CHECK_PROMPT = """You are a precise and thorough fact-checker. Your task is to verify if a given document directly
contradicts a set of provided facts. You must ignore any facts that are not present in the document.
Here is the document to analyze:
<document>
{document}
</document>

Here are the facts to check:
<facts>
{facts}
</facts>

Here is the schema for the JSON output you must produce:
<output_schema>
{output_schema}
</output_schema>

Please follow these steps:

1. Carefully read the document provided.
2. For each fact in the list of facts:
 a. Determine if the document directly contradicts the fact. Note that :
 - Any extra information in the fact not present in the document should not be considered a contradiction and
 be ignored.
 - If the document describes a different procedure to accomplish the same task in the fact, this should not
 constitute a contradiction unless the document explicitly states that the described procedure is the only way
 to accomplish the task
 b. If fact is not contradicted by the document, ignore the fact.
 c. If fact is contradicted, capture it in output

3. Construct your output in the JSON format specified by the output_schema.

Examples:
fact: "an apple is a fruit"
document: "an orange is a fruit".
result: no contradiction

fact: "an apple is a fruit and can be eaten after cutting by knife"
document: "an apple is a fruit"
result: no contradiction

fact: "an apple is a fruit and can be eaten after cutting by knife"
document: "an apple is a fruit and can be eaten by biting directly into it"
result: no contradiction

fact: "an apple is a fruit"
document: "an apple is a round fruit and can be eaten by biting directly into it"
result: no contradiction

fact: "an apple is a fruit"
document: "an apple is not a fruit"
result: contradiction

fact: "an apple can be eaten in 3 different ways: (1) biting, (2) slicing, (3) cutting"
document: "here are two different ways of eating apple: (1) biting and (2) cutting"
result: no contradiction, since extra information in fact not mentioned in document

Remember:
- Your final output must be strictly in the JSON format specified by the output_schema.
- Double-check your JSON structure before finalizing your response.
- Do not output any reasoning or justifications.
"""

# Asks whether the document contains PII.
# Placeholders: {document}, {output_schema}.
PII_PRESENCE_CHECK_PROMPT = """Check if the following document contains any Personally Identifiable Information (PII).
<document>
{document}
</document>

Structure the output using this json schema:
<output_schema>
{output_schema}
</output_schema>

Do not output any reasoning or justifications.
"""

# Single-line template built by implicit string concatenation (no newlines
# between the parts). Placeholder: {document}.
SUMMARY_PROMPT = (
    "Summarize the following document in no more than 100 words. "
    "<document>"
    "{document}"
    "</document>"
)


# Single-line template built by implicit string concatenation (no newlines
# between the parts). Placeholders: {document}, {prompt}, {output_schema}.
CUSTOM_METRIC_PROMPT = (
    "Extract the information requested by the prompt below from the document. "
    "<document>"
    "{document}"
    "</document>"
    "<prompt>"
    "{prompt}"
    "</prompt>"
    "Structure the output using this json schema:"
    "<output_schema>"
    "{output_schema}"
    "</output_schema>"
)
QNA_EXTRACT_PROMPT =
'You are an advanced text analysis system designed to extract key\ninformation from documents in the form of question-answer pairs. Your task is to analyze the given document\nand create up to {num_questions} question-answer pairs based on the information directly addressed in the text.\n\nFirst, carefully read the following document:\n\n<document>\n{document}\n</document>\n\nThen extract key questions and their corresponding answers from the document. The answer in each question-answer pair\nshould be self-contained and fully comprehensible without needing to refer back to the question or the original document.\n\nAfter completing your analysis, please format your output as a JSON object that adheres to the following\nschema:\n\n<output_schema>\n{output_schema}\n</output_schema>\n\n\nRemember:\n- The answer in each question-answer pair should be self-contained and fully comprehensible without needing to refer\n back to the question or the original document.\n- Your final output must be strictly in the JSON format specified by the output_schema.\n- Double-check your JSON structure before finalizing your response.\n- Do not output any reasoning or justifications\n'
MISSING_QUESTIONS_PROMPT =
'Check if the following document answers the following questions.\n<document>\n{document}\n</document>\n\n<questions>\n{questions}\n</questions>\n\nOutput just the list of questions (if any) not answered by the document, with the following output schema.\n<output_schema>\n{output_schema}\n</output_schema>\n'
FACT_CHECK_PROMPT =
'You are a precise and thorough fact-checker. Your task is to verify if a given document directly\ncontradicts a set of provided facts. You must ignore any facts that are not present in the document.\nHere is the document to analyze:\n<document>\n{document}\n</document>\n\nHere are the facts to check:\n<facts>\n{facts}\n</facts>\n\nHere is the schema for the JSON output you must produce:\n<output_schema>\n{output_schema}\n</output_schema>\n\nPlease follow these steps:\n\n1. Carefully read the document provided.\n2. For each fact in the list of facts:\n a. Determine if the document directly contradicts the fact. Note that :\n - Any extra information in the fact not present in the document should not be considered a contradiction and\n be ignored.\n - If the document describes a different procedure to accomplish the same task in the fact, this should not\n constitute a contradiction unless the document explicitly states that the described procedure is the only way\n to accomplish the task\n b. If fact is not contradicted by the document, ignore the fact.\n c. If fact is contradicted, capture it in output\n2. For each fact in the list of facts:\n a. Determine if the document directly contradicts the fact. Any extra information in the fact not present in the\n document should not be considered a contradiction and be ignored.\n b. If fact is not contradicted by the document, ignore the fact.\n c. If fact is contradicted, capture it in output\n\n3. 
Construct your output in the JSON format specified by the output_schema.\n\nExamples:\nfact: "an apple is a fruit"\ndocument: "an orange is a fruit".\nresult: no contradiction\n\nfact: "an apple is a fruit and can be eaten after cutting by knife"\ndocument: "an apple is a fruit"\nresult: no contradiction\n\nfact: "an apple is a fruit and can be eaten after cutting by knife"\ndocument: "an apple is a fruit and can be eaten by biting directly into it"\nresult: no contradiction\n\nfact: "an apple is a fruit"\ndocument: "an apple is a round fruit and can be eaten by biting directly into it"\nresult: no contradiction\n\nfact: "an apple is a fruit"\ndocument: "an apple is not a fruit"\nresult: contradiction\n\nfact: "an apple can be eaten in 3 different ways: (1) biting, (2) slicing, (3) cutting"\ndocument: "here are two different ways of eating apple: (1) biting and (2) cutting"\nresult: no contradiction, since extra information in fact not mentioned in document\n\nRemember:\n- Your final output must be strictly in the JSON format specified by the output_schema.\n- Double-check your JSON structure before finalizing your response.\n- Do not output any reasoning or justifications.\n'
PII_PRESENCE_CHECK_PROMPT =
'Check if the following document contains any Personally Identifiable Information (PII).\n<document>\n{document}\n</document>\n\nStructure the output using this json schema:\n<output_schema>\n{output_schema}\n</output_schema>\n\nDo not output any reasoning or justifications.\n'
SUMMARY_PROMPT =
'Summarize the following document in no more than 100 words. <document>{document}</document>'
CUSTOM_METRIC_PROMPT =
'Extract the information requested by the prompt below from the document. <document>{document}</document><prompt>{prompt}</prompt>Structure the output using this json schema:<output_schema>{output_schema}</output_schema>'