PDF Document
Extracted Data
Comparison
Fields
Raw Text
Prompts
Schema
LLM Extracted Data
{
"absentees": [],
"agendaItems": [
"mesh front-end AI",
"orchestrate viral solutions",
"streamline rich solutions",
"exploit rich relationships",
"redefine front-end systems"
],
"attendees": [
{
"name": "Rolando Jast",
"title": "Customer Creative Officer"
},
{
"name": "Erika Pacocha",
"title": "Regional Metrics Technician"
},
{
"name": "Candace Kozey",
"title": "Global Optimization Associate"
},
{
"name": "Miss Tonya Hackett",
"title": "Forward Tactics Administrator"
},
{
"name": "Winston King III",
"title": "Direct Brand Officer"
}
],
"chairman": {
"name": "Terry Harris DVM",
"title": "Human Communications Consultant"
},
"date": "2025-02-28",
"endTime": "14:00",
"location": "Schneider and Sons Headquarters, Smithworth",
"meetingNumber": "2026-12",
"meetingType": "annual_general_meeting",
"notes": "Ustilo subito distinctio confugo. Civitas usque esse adsidue vorax suggero aeneus suadeo appono absens.\nThermae demergo volaticus speculum vespillo ut velut aegrus.",
"resolutions": [
{
"abstentions": 1,
"description": "Trucido aestivus unus quam vita. Adversus adipiscor quibusdam tribuo viscus. Patior combibo voluptatum facilis\numquam ad casso suasoria video apparatus.",
"number": "1",
"passed": true,
"title": "target revolutionary synergies",
"votesAgainst": 0,
"votesFor": 4
},
{
"abstentions": 0,
"description": "Cuppedia sum quisquam carcer aggero alias laboriosam desino neque concido. Apto caries texo absens voveo\nsolutio vilis. Celer esse depono dolore aspicio occaecati laudantium ascit adopto.",
"number": "2",
"passed": true,
"title": "target next-generation supply-chains",
"votesAgainst": 0,
"votesFor": 5
}
],
"secretary": {
"name": "Beverly Nienow",
"title": "District Web Analyst"
},
"signatures": [
{
"name": "Terry Harris DVM",
"role": "Chairman",
"signedDate": "2025-02-28",
"title": "Human Communications Consultant"
},
{
"name": "Beverly Nienow",
"role": "Secretary",
"signedDate": "2025-02-28",
"title": "District Web Analyst"
}
],
"startTime": "12:00"
}
Side-by-Side Comparison
Extracted
{
"absentees": [],
"agendaItems": [
"mesh front-end AI",
"orchestrate viral solutions",
"streamline rich solutions",
"exploit rich relationships",
"redefine front-end systems"
],
"attendees": [
{
"name": "Rolando Jast",
"title": "Customer Creative Officer"
},
{
"name": "Erika Pacocha",
"title": "Regional Metrics Technician"
},
{
"name": "Candace Kozey",
"title": "Global Optimization Associate"
},
{
"name": "Miss Tonya Hackett",
"title": "Forward Tactics Administrator"
},
{
"name": "Winston King III",
"title": "Direct Brand Officer"
}
],
"chairman": {
"name": "Terry Harris DVM",
"title": "Human Communications Consultant"
},
"date": "2025-02-28",
"endTime": "14:00",
"location": "Schneider and Sons Headquarters, Smithworth",
"meetingNumber": "2026-12",
"meetingType": "annual_general_meeting",
"notes": "Ustilo subito distinctio confugo. Civitas usque esse adsidue vorax suggero aeneus suadeo appono absens.\nThermae demergo volaticus speculum vespillo ut velut aegrus.",
"resolutions": [
{
"abstentions": 1,
"description": "Trucido aestivus unus quam vita. Adversus adipiscor quibusdam tribuo viscus. Patior combibo voluptatum facilis\numquam ad casso suasoria video apparatus.",
"number": "1",
"passed": true,
"title": "target revolutionary synergies",
"votesAgainst": 0,
"votesFor": 4
},
{
"abstentions": 0,
"description": "Cuppedia sum quisquam carcer aggero alias laboriosam desino neque concido. Apto caries texo absens voveo\nsolutio vilis. Celer esse depono dolore aspicio occaecati laudantium ascit adopto.",
"number": "2",
"passed": true,
"title": "target next-generation supply-chains",
"votesAgainst": 0,
"votesFor": 5
}
],
"secretary": {
"name": "Beverly Nienow",
"title": "District Web Analyst"
},
"signatures": [
{
"name": "Terry Harris DVM",
"role": "Chairman",
"signedDate": "2025-02-28",
"title": "Human Communications Consultant"
},
{
"name": "Beverly Nienow",
"role": "Secretary",
"signedDate": "2025-02-28",
"title": "District Web Analyst"
}
],
"startTime": "12:00"
}
Ground Truth
{
"absentees": [],
"agendaItems": [
"1. mesh front-end AI",
"2. orchestrate viral solutions",
"3. streamline rich solutions",
"4. exploit rich relationships",
"5. redefine front-end systems"
],
"attendees": [
{
"email": "Josiane.Rempel@gmail.com",
"name": "Rolando Jast",
"title": "Customer Creative Officer"
},
{
"email": "Elisa.Sauer18@hotmail.com",
"name": "Erika Pacocha",
"title": "Regional Metrics Technician"
},
{
"email": "Aliza90@gmail.com",
"name": "Candace Kozey",
"title": "Global Optimization Associate"
},
{
"email": "Jaylon17@gmail.com",
"name": "Miss Tonya Hackett",
"title": "Forward Tactics Administrator"
},
{
"email": "Lafayette92@yahoo.com",
"name": "Winston King III",
"title": "Direct Brand Officer"
}
],
"category": "protocol",
"chairman": {
"email": "Martin_Littel@gmail.com",
"name": "Terry Harris DVM",
"title": "Human Communications Consultant"
},
"date": "2025-02-28",
"documentId": "protocol-002-en",
"endTime": "14:00",
"location": "Schneider and Sons Headquarters, Smithworth",
"meetingNumber": "2026-12",
"meetingType": "annual_general_meeting",
"notes": "Ustilo subito distinctio confugo. Civitas usque esse adsidue vorax suggero aeneus suadeo appono absens. Thermae demergo volaticus speculum vespillo ut velut aegrus.",
"resolutions": [
{
"abstentions": 1,
"description": "Trucido aestivus unus quam vita. Adversus adipiscor quibusdam tribuo viscus. Patior combibo voluptatum facilis umquam ad casso suasoria video apparatus.",
"number": 1,
"passed": true,
"title": "target revolutionary synergies",
"votesAgainst": 0,
"votesFor": 4
},
{
"abstentions": 0,
"description": "Cuppedia sum quisquam carcer aggero alias laboriosam desino neque concido. Apto caries texo absens voveo solutio vilis. Celer esse depono dolore aspicio occaecati laudantium ascit adopto.",
"number": 2,
"passed": true,
"title": "target next-generation supply-chains",
"votesAgainst": 0,
"votesFor": 5
}
],
"secretary": {
"email": "Ruthie_Bernier@yahoo.com",
"name": "Beverly Nienow",
"title": "District Web Analyst"
},
"signatures": [
{
"name": "Terry Harris DVM",
"role": "Chairman",
"signedDate": "2025-02-28",
"title": "Human Communications Consultant"
},
{
"name": "Beverly Nienow",
"role": "Secretary",
"signedDate": "2025-02-28",
"title": "District Web Analyst"
}
],
"startTime": "12:00",
"templateVariant": "default"
}
Field Analysis
Matched
52
Mismatched
0
Missing
0
Accuracy
100.0%
Matched 52
- ✓ attendees[1].name
- ✓ resolutions[1].title
- ✓ chairman.title
- ✓ signatures[0].name
- ✓ signatures[0].signedDate
- ✓ attendees[0].title
- ✓ attendees[1].title
- ✓ agendaItems[4]
- ✓ resolutions[1].abstentions
- ✓ secretary.title
- ✓ date
- ✓ agendaItems[3]
- ✓ attendees[2].name
- ✓ resolutions[0].votesFor
- ✓ resolutions[1].votesAgainst
- ✓ signatures[0].role
- ✓ signatures[0].title
- ✓ signatures[1].role
- ✓ attendees[4].name
- ✓ location
- ✓ resolutions[1].votesFor
- ✓ signatures[1].title
- ✓ signatures[1].signedDate
- ✓ attendees[3].name
- ✓ absentees._length
- ✓ meetingNumber
- ✓ attendees[3].title
- ✓ agendaItems[1]
- ✓ signatures[1].name
- ✓ startTime
- ✓ chairman.name
- ✓ attendees[4].title
- ✓ resolutions[0].title
- ✓ endTime
- ✓ attendees[0].name
- ✓ attendees._length
- ✓ resolutions[0].abstentions
- ✓ resolutions[0].description
- ✓ resolutions[0].votesAgainst
- ✓ signatures._length
- ✓ resolutions[1].passed
- ✓ resolutions._length
- ✓ resolutions[0].number
- ✓ secretary.name
- ✓ attendees[2].title
- ✓ agendaItems[0]
- ✓ agendaItems._length
- ✓ resolutions[1].description
- ✓ meetingType
- ✓ agendaItems[2]
- ✓ resolutions[0].passed
- ✓ resolutions[1].number
Extracted Text from PDF
MEETING PROTOCOL Meeting Type: ANNUAL GENERAL MEETING Meeting Number: 2026-12 Date: 2025-02-28 Time: 12:00 - 14:00 Location: Schneider and Sons Headquarters, Smithworth Officers Chairman: Terry Harris DVM (Human Communications Consultant) Secretary: Beverly Nienow (District Web Analyst) Attendees • Rolando Jast - Customer Creative Officer • Erika Pacocha - Regional Metrics Technician • Candace Kozey - Global Optimization Associate • Miss Tonya Hackett - Forward Tactics Administrator • Winston King III - Direct Brand Officer Agenda 1. mesh front-end AI 2. orchestrate viral solutions 3. streamline rich solutions 4. exploit rich relationships 5. redefine front-end systems Resolutions Resolution 1: target revolutionary synergies Trucido aestivus unus quam vita. Adversus adipiscor quibusdam tribuo viscus. Patior combibo voluptatum facilis umquam ad casso suasoria video apparatus. Votes: For: 4, Against: 0, Abstentions: 1 Result: PASSED Resolution 2: target next-generation supply-chains Cuppedia sum quisquam carcer aggero alias laboriosam desino neque concido. Apto caries texo absens voveo solutio vilis. Celer esse depono dolore aspicio occaecati laudantium ascit adopto. Votes: For: 5, Against: 0, Abstentions: 0 Result: PASSED Notes Ustilo subito distinctio confugo. Civitas usque esse adsidue vorax suggero aeneus suadeo appono absens. Thermae demergo volaticus speculum vespillo ut velut aegrus. Certification We hereby certify that these minutes are an accurate record of the proceedings. _______________________________ Chairman: Terry Harris DVM Human Communications Consultant Date: 2025-02-28 _______________________________ Secretary: Beverly Nienow District Web Analyst Date: 2025-02-28
System Prompt
You are a precise document data extraction expert. Your task is to extract structured data from protocol documents. ## Extraction Guidelines Extract meeting protocol data including: - Meeting type, number, date, start/end times, location - Chairman and secretary (name, title, email) - Attendees and absentees (arrays of objects with name, title, email) - Agenda items (array of strings) - Resolutions (number, title, description, votes, passed status) ## Important Rules 1. **Dates**: Always use ISO format (YYYY-MM-DD) for full dates, HH:MM for times 2. **Currency**: Use 3-letter ISO 4217 codes (EUR, USD, GBP, etc.) 3. **Missing optional fields**: Omit them entirely, don't use null or empty strings 4. **Required fields**: Make your best effort to extract; if truly not present, use reasonable placeholder 5. **Numbers**: Extract as numeric values, not strings (except for identifiers like document numbers) 6. **Arrays**: Always return arrays even if only one item exists 7. **Text content**: Preserve important content accurately but you may summarize very long passages 8. **Names**: Extract full names as they appear in the document Respond with a JSON object containing the extracted data. Be precise and extract only what is explicitly stated in the document.
User Prompt
Please extract all structured data from this protocol document: --- MEETING PROTOCOL Meeting Type: ANNUAL GENERAL MEETING Meeting Number: 2026-12 Date: 2025-02-28 Time: 12:00 - 14:00 Location: Schneider and Sons Headquarters, Smithworth Officers Chairman: Terry Harris DVM (Human Communications Consultant) Secretary: Beverly Nienow (District Web Analyst) Attendees • Rolando Jast - Customer Creative Officer • Erika Pacocha - Regional Metrics Technician • Candace Kozey - Global Optimization Associate • Miss Tonya Hackett - Forward Tactics Administrator • Winston King III - Direct Brand Officer Agenda 1. mesh front-end AI 2. orchestrate viral solutions 3. streamline rich solutions 4. exploit rich relationships 5. redefine front-end systems Resolutions Resolution 1: target revolutionary synergies Trucido aestivus unus quam vita. Adversus adipiscor quibusdam tribuo viscus. Patior combibo voluptatum facilis umquam ad casso suasoria video apparatus. Votes: For: 4, Against: 0, Abstentions: 1 Result: PASSED Resolution 2: target next-generation supply-chains Cuppedia sum quisquam carcer aggero alias laboriosam desino neque concido. Apto caries texo absens voveo solutio vilis. Celer esse depono dolore aspicio occaecati laudantium ascit adopto. Votes: For: 5, Against: 0, Abstentions: 0 Result: PASSED Notes Ustilo subito distinctio confugo. Civitas usque esse adsidue vorax suggero aeneus suadeo appono absens. Thermae demergo volaticus speculum vespillo ut velut aegrus. Certification We hereby certify that these minutes are an accurate record of the proceedings. _______________________________ Chairman: Terry Harris DVM Human Communications Consultant Date: 2025-02-28 _______________________________ Secretary: Beverly Nienow District Web Analyst Date: 2025-02-28 --- Extract the data as JSON according to the schema.
Raw LLM Response
{
"meetingType": "annual_general_meeting",
"date": "2025-02-28",
"chairman": {
"name": "Terry Harris DVM",
"title": "Human Communications Consultant"
},
"absentees": [],
"signatures": [
{
"role": "Chairman",
"name": "Terry Harris DVM",
"signedDate": "2025-02-28",
"title": "Human Communications Consultant"
},
{
"role": "Secretary",
"name": "Beverly Nienow",
"signedDate": "2025-02-28",
"title": "District Web Analyst"
}
],
"agendaItems": [
"mesh front-end AI",
"orchestrate viral solutions",
"streamline rich solutions",
"exploit rich relationships",
"redefine front-end systems"
],
"attendees": [
{
"name": "Rolando Jast",
"title": "Customer Creative Officer"
},
{
"name": "Erika Pacocha",
"title": "Regional Metrics Technician"
},
{
"name": "Candace Kozey",
"title": "Global Optimization Associate"
},
{
"name": "Miss Tonya Hackett",
"title": "Forward Tactics Administrator"
},
{
"name": "Winston King III",
"title": "Direct Brand Officer"
}
],
"endTime": "14:00",
"location": "Schneider and Sons Headquarters, Smithworth",
"meetingNumber": "2026-12",
"notes": "Ustilo subito distinctio confugo. Civitas usque esse adsidue vorax suggero aeneus suadeo appono absens.\nThermae demergo volaticus speculum vespillo ut velut aegrus.",
"resolutions": [
{
"number": "1",
"title": "target revolutionary synergies",
"passed": true,
"votesFor": 4,
"votesAgainst": 0,
"abstentions": 1,
"description": "Trucido aestivus unus quam vita. Adversus adipiscor quibusdam tribuo viscus. Patior combibo voluptatum facilis\numquam ad casso suasoria video apparatus."
},
{
"number": "2",
"title": "target next-generation supply-chains",
"passed": true,
"votesFor": 5,
"votesAgainst": 0,
"abstentions": 0,
"description": "Cuppedia sum quisquam carcer aggero alias laboriosam desino neque concido. Apto caries texo absens voveo\nsolutio vilis. Celer esse depono dolore aspicio occaecati laudantium ascit adopto."
}
],
"secretary": {
"name": "Beverly Nienow",
"title": "District Web Analyst"
},
"startTime": "12:00"
}
JSON Schema (Structured Output)
This schema is passed to the LLM via ResponseSchema
to enforce structured JSON output.
{
"example": {
"absentees": [],
"agendaItems": [
"1. Approval of Previous Meeting Minutes",
"2. Financial Report Q1 2024",
"3. Strategic Planning Discussion"
],
"attendees": [
{
"name": "Michael Johnson",
"title": "Chief Financial Officer"
},
{
"name": "Sarah Williams",
"title": "Chief Operating Officer"
}
],
"chairman": {
"name": "John Smith",
"title": "Chairman of the Board"
},
"date": "2024-03-15",
"endTime": "12:00",
"location": "Corporate Headquarters, Conference Room A",
"meetingNumber": "2024-001",
"meetingType": "board_meeting",
"notes": "Meeting adjourned at 12:00 PM. Next meeting scheduled for April 15, 2024.",
"resolutions": [
{
"abstentions": 0,
"description": "The board approves the proposed Q1 2024 budget of $2.5 million.",
"number": "1",
"passed": true,
"title": "Approval of Q1 Budget",
"votesAgainst": 0,
"votesFor": 4
}
],
"secretary": {
"name": "Jane Doe",
"title": "Corporate Secretary"
},
"signatures": [
{
"name": "John Smith",
"role": "Chairman",
"signedDate": "2024-03-15",
"title": "Chairman of the Board"
},
{
"name": "Jane Doe",
"role": "Secretary",
"signedDate": "2024-03-15",
"title": "Corporate Secretary"
}
],
"startTime": "10:00"
},
"properties": {
"absentees": {
"description": "List of people who were absent from the meeting. Use empty array [] if no absentees.",
"items": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"agendaItems": {
"items": {
"type": "STRING"
},
"type": "ARRAY"
},
"attendees": {
"items": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"chairman": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"date": {
"description": "Meeting date in YYYY-MM-DD format",
"type": "STRING"
},
"endTime": {
"description": "End time in HH:MM format",
"type": "STRING"
},
"location": {
"description": "Meeting location",
"type": "STRING"
},
"meetingNumber": {
"description": "Meeting reference number",
"type": "STRING"
},
"meetingType": {
"description": "Type of meeting",
"enum": [
"board_meeting",
"shareholder_meeting",
"annual_general_meeting",
"extraordinary_general_meeting"
],
"type": "STRING"
},
"notes": {
"type": "STRING"
},
"resolutions": {
"items": {
"properties": {
"abstentions": {
"description": "Number of abstentions. Use 0 if none.",
"type": "INTEGER"
},
"description": {
"type": "STRING"
},
"number": {
"type": "STRING"
},
"passed": {
"type": "BOOLEAN"
},
"title": {
"type": "STRING"
},
"votesAgainst": {
"description": "Number of votes against",
"type": "INTEGER"
},
"votesFor": {
"description": "Number of votes in favor",
"type": "INTEGER"
}
},
"required": [
"number",
"title",
"passed",
"votesFor",
"votesAgainst",
"abstentions"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"secretary": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"signatures": {
"description": "Signatures certifying the protocol accuracy. Typically signed by chairman and secretary.",
"items": {
"properties": {
"name": {
"description": "Full name of the person signing",
"type": "STRING"
},
"role": {
"description": "Role of the signatory (e.g., Chairman, Secretary)",
"type": "STRING"
},
"signedDate": {
"description": "Date the protocol was signed in YYYY-MM-DD format",
"type": "STRING"
},
"title": {
"description": "Job title of the signatory",
"type": "STRING"
}
},
"required": [
"role",
"name",
"signedDate"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"startTime": {
"description": "Start time in HH:MM format",
"type": "STRING"
}
},
"required": [
"meetingType",
"date",
"chairman",
"absentees",
"signatures"
],
"type": "OBJECT"
}