PDF Document
Extracted Data
Comparison
Fields
Raw Text
Prompts
Schema
LLM Extracted Data
{
"absentees": [
{
"name": "Mr. Clark Davis"
}
],
"agendaItems": [
"brand proactive infrastructures",
"deploy world-class niches",
"expedite next-generation experiences"
],
"attendees": [
{
"name": "Jessie Schuster",
"title": "District Web Planner"
},
{
"name": "Mike Feil",
"title": "Central Directives Planner"
},
{
"name": "Eva Funk",
"title": "Internal Identity Executive"
}
],
"chairman": {
"name": "Mrs. Tonya Doyle V",
"title": "Regional Identity Representative"
},
"date": "2025-05-07",
"endTime": "13:00",
"location": "Bartoletti LLC Headquarters, Linden",
"meetingNumber": "2026-5",
"meetingType": "board_meeting",
"notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
"resolutions": [
{
"abstentions": 0,
"description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio\nviridis tepidus.",
"number": "1",
"passed": true,
"title": "monetize B2C architectures",
"votesAgainst": 0,
"votesFor": 3
},
{
"abstentions": 1,
"description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene\ninflammatio.",
"number": "2",
"passed": false,
"title": "brand ubiquitous relationships",
"votesAgainst": 1,
"votesFor": 1
},
{
"abstentions": 0,
"description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne\nvicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca\nconcedo ullus.",
"number": "3",
"passed": true,
"title": "monetize intuitive networks",
"votesAgainst": 0,
"votesFor": 3
}
],
"secretary": {
"name": "Terence Batz",
"title": "Principal Factors Developer"
},
"signatures": [
{
"name": "Mrs. Tonya Doyle V",
"role": "Chairman",
"signedDate": "2025-05-07",
"title": "Regional Identity Representative"
},
{
"name": "Terence Batz",
"role": "Secretary",
"signedDate": "2025-05-07",
"title": "Principal Factors Developer"
}
],
"startTime": "12:00"
}
Side-by-Side Comparison
Extracted
{
"absentees": [
{
"name": "Mr. Clark Davis"
}
],
"agendaItems": [
"brand proactive infrastructures",
"deploy world-class niches",
"expedite next-generation experiences"
],
"attendees": [
{
"name": "Jessie Schuster",
"title": "District Web Planner"
},
{
"name": "Mike Feil",
"title": "Central Directives Planner"
},
{
"name": "Eva Funk",
"title": "Internal Identity Executive"
}
],
"chairman": {
"name": "Mrs. Tonya Doyle V",
"title": "Regional Identity Representative"
},
"date": "2025-05-07",
"endTime": "13:00",
"location": "Bartoletti LLC Headquarters, Linden",
"meetingNumber": "2026-5",
"meetingType": "board_meeting",
"notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
"resolutions": [
{
"abstentions": 0,
"description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio\nviridis tepidus.",
"number": "1",
"passed": true,
"title": "monetize B2C architectures",
"votesAgainst": 0,
"votesFor": 3
},
{
"abstentions": 1,
"description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene\ninflammatio.",
"number": "2",
"passed": false,
"title": "brand ubiquitous relationships",
"votesAgainst": 1,
"votesFor": 1
},
{
"abstentions": 0,
"description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne\nvicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca\nconcedo ullus.",
"number": "3",
"passed": true,
"title": "monetize intuitive networks",
"votesAgainst": 0,
"votesFor": 3
}
],
"secretary": {
"name": "Terence Batz",
"title": "Principal Factors Developer"
},
"signatures": [
{
"name": "Mrs. Tonya Doyle V",
"role": "Chairman",
"signedDate": "2025-05-07",
"title": "Regional Identity Representative"
},
{
"name": "Terence Batz",
"role": "Secretary",
"signedDate": "2025-05-07",
"title": "Principal Factors Developer"
}
],
"startTime": "12:00"
}
Ground Truth
{
"absentees": [
{
"email": "Scot.Stracke97@hotmail.com",
"name": "Mr. Clark Davis",
"title": "Forward Solutions Executive"
}
],
"agendaItems": [
"1. brand proactive infrastructures",
"2. deploy world-class niches",
"3. expedite next-generation experiences"
],
"attendees": [
{
"email": "Landen.Miller@yahoo.com",
"name": "Jessie Schuster",
"title": "District Web Planner"
},
{
"email": "Annamarie93@hotmail.com",
"name": "Mike Feil",
"title": "Central Directives Planner"
},
{
"email": "Guillermo22@gmail.com",
"name": "Eva Funk",
"title": "Internal Identity Executive"
}
],
"category": "protocol",
"chairman": {
"email": "Jalyn8@gmail.com",
"name": "Mrs. Tonya Doyle V",
"title": "Regional Identity Representative"
},
"date": "2025-05-07",
"documentId": "protocol-004-en",
"endTime": "13:00",
"location": "Bartoletti LLC Headquarters, Linden",
"meetingNumber": "2026-5",
"meetingType": "board_meeting",
"notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
"resolutions": [
{
"abstentions": 0,
"description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio viridis tepidus.",
"number": 1,
"passed": true,
"title": "monetize B2C architectures",
"votesAgainst": 0,
"votesFor": 3
},
{
"abstentions": 1,
"description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene inflammatio.",
"number": 2,
"passed": false,
"title": "brand ubiquitous relationships",
"votesAgainst": 1,
"votesFor": 1
},
{
"abstentions": 0,
"description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne vicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca concedo ullus.",
"number": 3,
"passed": true,
"title": "monetize intuitive networks",
"votesAgainst": 0,
"votesFor": 3
}
],
"secretary": {
"email": "Jacky_Murray@hotmail.com",
"name": "Terence Batz",
"title": "Principal Factors Developer"
},
"signatures": [
{
"name": "Mrs. Tonya Doyle V",
"role": "Chairman",
"signedDate": "2025-05-07",
"title": "Regional Identity Representative"
},
{
"name": "Terence Batz",
"role": "Secretary",
"signedDate": "2025-05-07",
"title": "Principal Factors Developer"
}
],
"startTime": "12:00",
"templateVariant": "default"
}
Field Analysis
Matched
54
Mismatched
0
Missing
1
Accuracy
98.2%
Missing 1
- ? absentees[0].title expected "Forward Solutions Executive"
Matched 54
- ✓ meetingType
- ✓ resolutions[1].number
- ✓ secretary.title
- ✓ resolutions[2].votesFor
- ✓ resolutions[0].abstentions
- ✓ signatures[0].role
- ✓ signatures[1].name
- ✓ agendaItems[0]
- ✓ resolutions[2].votesAgainst
- ✓ endTime
- ✓ resolutions[0].votesAgainst
- ✓ resolutions[2].title
- ✓ location
- ✓ attendees[2].name
- ✓ attendees[2].title
- ✓ meetingNumber
- ✓ signatures[1].role
- ✓ signatures[1].title
- ✓ resolutions[1].votesFor
- ✓ resolutions[1].passed
- ✓ resolutions[2].passed
- ✓ resolutions[2].number
- ✓ attendees._length
- ✓ resolutions[0].title
- ✓ secretary.name
- ✓ resolutions[1].votesAgainst
- ✓ attendees[0].name
- ✓ attendees[1].title
- ✓ resolutions[0].description
- ✓ signatures[0].name
- ✓ resolutions[1].abstentions
- ✓ chairman.name
- ✓ chairman.title
- ✓ agendaItems[2]
- ✓ resolutions[0].votesFor
- ✓ absentees[0].name
- ✓ resolutions[2].description
- ✓ attendees[1].name
- ✓ signatures._length
- ✓ resolutions[1].title
- ✓ resolutions[1].description
- ✓ agendaItems[1]
- ✓ signatures[1].signedDate
- ✓ attendees[0].title
- ✓ resolutions[0].passed
- ✓ absentees._length
- ✓ signatures[0].title
- ✓ startTime
- ✓ signatures[0].signedDate
- ✓ agendaItems._length
- ✓ date
- ✓ resolutions[0].number
- ✓ resolutions[2].abstentions
- ✓ resolutions._length
Extracted Text from PDF
MEETING PROTOCOL Meeting Type: BOARD MEETING Meeting Number: 2026-5 Date: 2025-05-07 Time: 12:00 - 13:00 Location: Bartoletti LLC Headquarters, Linden Officers Chairman: Mrs. Tonya Doyle V (Regional Identity Representative) Secretary: Terence Batz (Principal Factors Developer) Attendees • Jessie Schuster - District Web Planner • Mike Feil - Central Directives Planner • Eva Funk - Internal Identity Executive Absent • Mr. Clark Davis Agenda 1. brand proactive infrastructures 2. deploy world-class niches 3. expedite next-generation experiences Resolutions Resolution 1: monetize B2C architectures Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio viridis tepidus. Votes: For: 3, Against: 0, Abstentions: 0 Result: PASSED Resolution 2: brand ubiquitous relationships Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene inflammatio. Votes: For: 1, Against: 1, Abstentions: 1 Result: NOT PASSED Resolution 3: monetize intuitive networks Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne vicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca concedo ullus. Votes: For: 3, Against: 0, Abstentions: 0 Result: PASSED Notes Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax. Certification We hereby certify that these minutes are an accurate record of the proceedings. _______________________________ Chairman: Mrs. Tonya Doyle V Regional Identity Representative Date: 2025-05-07 _______________________________ Secretary: Terence Batz Principal Factors Developer Date: 2025-05-07
System Prompt
You are a precise document data extraction expert. Your task is to extract structured data from protocol documents.

## Extraction Guidelines

Extract meeting protocol data including:
- Meeting type, number, date, start/end times, location
- Chairman and secretary (name, title, email)
- Attendees and absentees (arrays of objects with name, title, email)
- Agenda items (array of strings)
- Resolutions (number, title, description, votes, passed status)

## Important Rules

1. **Dates**: Always use ISO format (YYYY-MM-DD) for full dates, HH:MM for times
2. **Currency**: Use 3-letter ISO 4217 codes (EUR, USD, GBP, etc.)
3. **Missing optional fields**: Omit them entirely, don't use null or empty strings
4. **Required fields**: Make your best effort to extract; if truly not present, use a reasonable placeholder
5. **Numbers**: Extract as numeric values, not strings (except for identifiers like document numbers)
6. **Arrays**: Always return arrays even if only one item exists
7. **Text content**: Preserve important content accurately but you may summarize very long passages
8. **Names**: Extract full names as they appear in the document

Respond with a JSON object containing the extracted data. Be precise and extract only what is explicitly stated in the document.
User Prompt
Please extract all structured data from this protocol document: --- MEETING PROTOCOL Meeting Type: BOARD MEETING Meeting Number: 2026-5 Date: 2025-05-07 Time: 12:00 - 13:00 Location: Bartoletti LLC Headquarters, Linden Officers Chairman: Mrs. Tonya Doyle V (Regional Identity Representative) Secretary: Terence Batz (Principal Factors Developer) Attendees • Jessie Schuster - District Web Planner • Mike Feil - Central Directives Planner • Eva Funk - Internal Identity Executive Absent • Mr. Clark Davis Agenda 1. brand proactive infrastructures 2. deploy world-class niches 3. expedite next-generation experiences Resolutions Resolution 1: monetize B2C architectures Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio viridis tepidus. Votes: For: 3, Against: 0, Abstentions: 0 Result: PASSED Resolution 2: brand ubiquitous relationships Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene inflammatio. Votes: For: 1, Against: 1, Abstentions: 1 Result: NOT PASSED Resolution 3: monetize intuitive networks Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne vicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca concedo ullus. Votes: For: 3, Against: 0, Abstentions: 0 Result: PASSED Notes Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax. Certification We hereby certify that these minutes are an accurate record of the proceedings. _______________________________ Chairman: Mrs. Tonya Doyle V Regional Identity Representative Date: 2025-05-07 _______________________________ Secretary: Terence Batz Principal Factors Developer Date: 2025-05-07 --- Extract the data as JSON according to the schema.
Raw LLM Response
{
"meetingType": "board_meeting",
"date": "2025-05-07",
"chairman": {
"name": "Mrs. Tonya Doyle V",
"title": "Regional Identity Representative"
},
"absentees": [
{
"name": "Mr. Clark Davis"
}
],
"signatures": [
{
"role": "Chairman",
"name": "Mrs. Tonya Doyle V",
"signedDate": "2025-05-07",
"title": "Regional Identity Representative"
},
{
"role": "Secretary",
"name": "Terence Batz",
"signedDate": "2025-05-07",
"title": "Principal Factors Developer"
}
],
"agendaItems": [
"brand proactive infrastructures",
"deploy world-class niches",
"expedite next-generation experiences"
],
"attendees": [
{
"name": "Jessie Schuster",
"title": "District Web Planner"
},
{
"name": "Mike Feil",
"title": "Central Directives Planner"
},
{
"name": "Eva Funk",
"title": "Internal Identity Executive"
}
],
"endTime": "13:00",
"location": "Bartoletti LLC Headquarters, Linden",
"meetingNumber": "2026-5",
"notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
"resolutions": [
{
"number": "1",
"title": "monetize B2C architectures",
"passed": true,
"votesFor": 3,
"votesAgainst": 0,
"abstentions": 0,
"description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio\nviridis tepidus."
},
{
"number": "2",
"title": "brand ubiquitous relationships",
"passed": false,
"votesFor": 1,
"votesAgainst": 1,
"abstentions": 1,
"description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene\ninflammatio."
},
{
"number": "3",
"title": "monetize intuitive networks",
"passed": true,
"votesFor": 3,
"votesAgainst": 0,
"abstentions": 0,
"description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne\nvicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca\nconcedo ullus."
}
],
"secretary": {
"name": "Terence Batz",
"title": "Principal Factors Developer"
},
"startTime": "12:00"
}
JSON Schema (Structured Output)
This schema is passed to the LLM via `ResponseSchema` to enforce structured JSON output.
{
"example": {
"absentees": [],
"agendaItems": [
"1. Approval of Previous Meeting Minutes",
"2. Financial Report Q1 2024",
"3. Strategic Planning Discussion"
],
"attendees": [
{
"name": "Michael Johnson",
"title": "Chief Financial Officer"
},
{
"name": "Sarah Williams",
"title": "Chief Operating Officer"
}
],
"chairman": {
"name": "John Smith",
"title": "Chairman of the Board"
},
"date": "2024-03-15",
"endTime": "12:00",
"location": "Corporate Headquarters, Conference Room A",
"meetingNumber": "2024-001",
"meetingType": "board_meeting",
"notes": "Meeting adjourned at 12:00 PM. Next meeting scheduled for April 15, 2024.",
"resolutions": [
{
"abstentions": 0,
"description": "The board approves the proposed Q1 2024 budget of $2.5 million.",
"number": "1",
"passed": true,
"title": "Approval of Q1 Budget",
"votesAgainst": 0,
"votesFor": 4
}
],
"secretary": {
"name": "Jane Doe",
"title": "Corporate Secretary"
},
"signatures": [
{
"name": "John Smith",
"role": "Chairman",
"signedDate": "2024-03-15",
"title": "Chairman of the Board"
},
{
"name": "Jane Doe",
"role": "Secretary",
"signedDate": "2024-03-15",
"title": "Corporate Secretary"
}
],
"startTime": "10:00"
},
"properties": {
"absentees": {
"description": "List of people who were absent from the meeting. Use empty array [] if no absentees.",
"items": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"agendaItems": {
"items": {
"type": "STRING"
},
"type": "ARRAY"
},
"attendees": {
"items": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"chairman": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"date": {
"description": "Meeting date in YYYY-MM-DD format",
"type": "STRING"
},
"endTime": {
"description": "End time in HH:MM format",
"type": "STRING"
},
"location": {
"description": "Meeting location",
"type": "STRING"
},
"meetingNumber": {
"description": "Meeting reference number",
"type": "STRING"
},
"meetingType": {
"description": "Type of meeting",
"enum": [
"board_meeting",
"shareholder_meeting",
"annual_general_meeting",
"extraordinary_general_meeting"
],
"type": "STRING"
},
"notes": {
"type": "STRING"
},
"resolutions": {
"items": {
"properties": {
"abstentions": {
"description": "Number of abstentions. Use 0 if none.",
"type": "INTEGER"
},
"description": {
"type": "STRING"
},
"number": {
"type": "STRING"
},
"passed": {
"type": "BOOLEAN"
},
"title": {
"type": "STRING"
},
"votesAgainst": {
"description": "Number of votes against",
"type": "INTEGER"
},
"votesFor": {
"description": "Number of votes in favor",
"type": "INTEGER"
}
},
"required": [
"number",
"title",
"passed",
"votesFor",
"votesAgainst",
"abstentions"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"secretary": {
"properties": {
"email": {
"description": "Email address",
"type": "STRING"
},
"name": {
"description": "Full name of the person",
"type": "STRING"
},
"title": {
"description": "Job title or role",
"type": "STRING"
}
},
"required": [
"name"
],
"type": "OBJECT"
},
"signatures": {
"description": "Signatures certifying the protocol accuracy. Typically signed by chairman and secretary.",
"items": {
"properties": {
"name": {
"description": "Full name of the person signing",
"type": "STRING"
},
"role": {
"description": "Role of the signatory (e.g., Chairman, Secretary)",
"type": "STRING"
},
"signedDate": {
"description": "Date the protocol was signed in YYYY-MM-DD format",
"type": "STRING"
},
"title": {
"description": "Job title of the signatory",
"type": "STRING"
}
},
"required": [
"role",
"name",
"signedDate"
],
"type": "OBJECT"
},
"type": "ARRAY"
},
"startTime": {
"description": "Start time in HH:MM format",
"type": "STRING"
}
},
"required": [
"meetingType",
"date",
"chairman",
"absentees",
"signatures"
],
"type": "OBJECT"
}