{
|
|
"_comment": "This is a template extraction schema. Customize for your specific use case.",
|
|
"_instructions": "Fill in the sections below with your specific extraction requirements.",
|
|
|
|
"objective": "Carefully analyze this paper and extract [DESCRIBE YOUR DATA TYPE, e.g., 'empirical observations of X' or 'experimental measurements of Y']",
|
|
|
|
"system_context": "You are a scientific research assistant specializing in [YOUR DOMAIN, e.g., 'ecology', 'chemistry', or 'medicine']. Your task is to analyze scientific papers and extract structured data for systematic review and meta-analysis.",
|
|
|
|
"instructions": [
|
|
"Determine if the paper contains [YOUR CRITERIA, e.g., 'primary empirical data']",
|
|
"If present, extract all [YOUR RECORD TYPE, e.g., 'observation records', 'measurements', 'outcomes']",
|
|
"For each record, extract the following information: [LIST KEY FIELDS]"
|
|
],
|
|
|
|
"analysis_steps": [
|
|
"1. Identify and quote relevant sections containing [YOUR DATA TYPE]",
|
|
"2. List each [RECORD UNIT, e.g., 'species', 'compound', 'patient cohort']",
|
|
"3. For each unit, extract required information and quote supporting text",
|
|
"4. [ADD DOMAIN-SPECIFIC VALIDATION STEPS]",
|
|
"5. Double-check for accuracy and completeness"
|
|
],
|
|
|
|
"important_notes": [
|
|
"Only include PRIMARY data from this paper, not secondary sources",
|
|
"If a record involves multiple [UNITS], separate it into individual records",
|
|
"Do not add fields not in the schema",
|
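|
"Use 'none' for unknown text values and empty lists for unknown list values; omit optional numeric fields (e.g., sample_size) rather than filling them with a placeholder",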
|
|
"List names exactly as they appear in the source"
|
|
],
|
|
|
|
"output_schema": {
|
|
"type": "object",
|
|
"properties": {
|
|
"has_relevant_data": {
|
|
"type": "boolean",
|
|
"description": "Whether the paper contains the target data type"
|
|
},
|
|
"data_description": {
|
|
"type": "string",
|
|
"description": "Brief explanation of what data is present"
|
|
},
|
|
"records": {
|
|
"type": "array",
|
|
"description": "List of extracted records",
|
|
"items": {
|
|
"type": "object",
|
|
"$comment": "CUSTOMIZE THESE FIELDS FOR YOUR USE CASE",
|
|
"properties": {
|
|
"location": {
|
|
"type": "string",
|
|
"description": "Geographic location (if applicable)"
|
|
},
|
|
"subject": {
|
|
"type": "string",
|
|
"description": "Main subject of the record (species, compound, etc.)"
|
|
},
|
|
"measurement_type": {
|
|
"type": "string",
|
|
"description": "Type of measurement or observation"
|
|
},
|
|
"value": {
|
|
"type": ["number", "string"],
|
|
"description": "Measured or observed value"
|
|
},
|
|
"units": {
|
|
"type": "string",
|
|
"description": "Units of measurement"
|
|
},
|
|
"method": {
|
|
"type": "string",
|
|
"description": "Brief description of methodology"
|
|
},
|
|
"sample_size": {
|
|
"type": "integer",
|
|
"description": "Sample size if applicable"
|
|
},
|
|
"notes": {
|
|
"type": "string",
|
|
"description": "Additional relevant notes"
|
|
}
|
|
},
|
|
"required": ["subject"]
|
|
}
|
|
}
|
|
},
|
|
"required": ["has_relevant_data", "records"]
|
|
},
|
|
|
|
"output_example": {
|
|
"has_relevant_data": true,
|
|
"data_description": "Paper reports 1 observation record from 1 location",
|
|
"records": [
|
|
{
|
|
"location": "Example Location",
|
|
"subject": "Example Subject",
|
|
"measurement_type": "Example Type",
|
|
"value": 42.5,
|
|
"units": "mg/L",
|
|
"method": "Brief methodology description",
|
|
"sample_size": 20,
|
|
"notes": "Any relevant notes"
|
|
}
|
|
]
|
|
}
|
|
}
|