← Back

protocol-004-en extraction

98.2%
Model: gemini-2.0-flash
Latency: 6.763s
Tokens: 1385/805
PDF Document
Extracted Data
Comparison
Fields
Raw Text
Prompts
Schema
LLM Extracted Data
{
  "absentees": [
    {
      "name": "Mr. Clark Davis"
    }
  ],
  "agendaItems": [
    "brand proactive infrastructures",
    "deploy world-class niches",
    "expedite next-generation experiences"
  ],
  "attendees": [
    {
      "name": "Jessie Schuster",
      "title": "District Web Planner"
    },
    {
      "name": "Mike Feil",
      "title": "Central Directives Planner"
    },
    {
      "name": "Eva Funk",
      "title": "Internal Identity Executive"
    }
  ],
  "chairman": {
    "name": "Mrs. Tonya Doyle V",
    "title": "Regional Identity Representative"
  },
  "date": "2025-05-07",
  "endTime": "13:00",
  "location": "Bartoletti LLC Headquarters, Linden",
  "meetingNumber": "2026-5",
  "meetingType": "board_meeting",
  "notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
  "resolutions": [
    {
      "abstentions": 0,
      "description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio\nviridis tepidus.",
      "number": "1",
      "passed": true,
      "title": "monetize B2C architectures",
      "votesAgainst": 0,
      "votesFor": 3
    },
    {
      "abstentions": 1,
      "description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene\ninflammatio.",
      "number": "2",
      "passed": false,
      "title": "brand ubiquitous relationships",
      "votesAgainst": 1,
      "votesFor": 1
    },
    {
      "abstentions": 0,
      "description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne\nvicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca\nconcedo ullus.",
      "number": "3",
      "passed": true,
      "title": "monetize intuitive networks",
      "votesAgainst": 0,
      "votesFor": 3
    }
  ],
  "secretary": {
    "name": "Terence Batz",
    "title": "Principal Factors Developer"
  },
  "signatures": [
    {
      "name": "Mrs. Tonya Doyle V",
      "role": "Chairman",
      "signedDate": "2025-05-07",
      "title": "Regional Identity Representative"
    },
    {
      "name": "Terence Batz",
      "role": "Secretary",
      "signedDate": "2025-05-07",
      "title": "Principal Factors Developer"
    }
  ],
  "startTime": "12:00"
}
Side-by-Side Comparison

Extracted

{
  "absentees": [
    {
      "name": "Mr. Clark Davis"
    }
  ],
  "agendaItems": [
    "brand proactive infrastructures",
    "deploy world-class niches",
    "expedite next-generation experiences"
  ],
  "attendees": [
    {
      "name": "Jessie Schuster",
      "title": "District Web Planner"
    },
    {
      "name": "Mike Feil",
      "title": "Central Directives Planner"
    },
    {
      "name": "Eva Funk",
      "title": "Internal Identity Executive"
    }
  ],
  "chairman": {
    "name": "Mrs. Tonya Doyle V",
    "title": "Regional Identity Representative"
  },
  "date": "2025-05-07",
  "endTime": "13:00",
  "location": "Bartoletti LLC Headquarters, Linden",
  "meetingNumber": "2026-5",
  "meetingType": "board_meeting",
  "notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
  "resolutions": [
    {
      "abstentions": 0,
      "description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio\nviridis tepidus.",
      "number": "1",
      "passed": true,
      "title": "monetize B2C architectures",
      "votesAgainst": 0,
      "votesFor": 3
    },
    {
      "abstentions": 1,
      "description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene\ninflammatio.",
      "number": "2",
      "passed": false,
      "title": "brand ubiquitous relationships",
      "votesAgainst": 1,
      "votesFor": 1
    },
    {
      "abstentions": 0,
      "description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne\nvicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca\nconcedo ullus.",
      "number": "3",
      "passed": true,
      "title": "monetize intuitive networks",
      "votesAgainst": 0,
      "votesFor": 3
    }
  ],
  "secretary": {
    "name": "Terence Batz",
    "title": "Principal Factors Developer"
  },
  "signatures": [
    {
      "name": "Mrs. Tonya Doyle V",
      "role": "Chairman",
      "signedDate": "2025-05-07",
      "title": "Regional Identity Representative"
    },
    {
      "name": "Terence Batz",
      "role": "Secretary",
      "signedDate": "2025-05-07",
      "title": "Principal Factors Developer"
    }
  ],
  "startTime": "12:00"
}

Ground Truth

{
  "absentees": [
    {
      "email": "Scot.Stracke97@hotmail.com",
      "name": "Mr. Clark Davis",
      "title": "Forward Solutions Executive"
    }
  ],
  "agendaItems": [
    "1. brand proactive infrastructures",
    "2. deploy world-class niches",
    "3. expedite next-generation experiences"
  ],
  "attendees": [
    {
      "email": "Landen.Miller@yahoo.com",
      "name": "Jessie Schuster",
      "title": "District Web Planner"
    },
    {
      "email": "Annamarie93@hotmail.com",
      "name": "Mike Feil",
      "title": "Central Directives Planner"
    },
    {
      "email": "Guillermo22@gmail.com",
      "name": "Eva Funk",
      "title": "Internal Identity Executive"
    }
  ],
  "category": "protocol",
  "chairman": {
    "email": "Jalyn8@gmail.com",
    "name": "Mrs. Tonya Doyle V",
    "title": "Regional Identity Representative"
  },
  "date": "2025-05-07",
  "documentId": "protocol-004-en",
  "endTime": "13:00",
  "location": "Bartoletti LLC Headquarters, Linden",
  "meetingNumber": "2026-5",
  "meetingType": "board_meeting",
  "notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
  "resolutions": [
    {
      "abstentions": 0,
      "description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio viridis tepidus.",
      "number": 1,
      "passed": true,
      "title": "monetize B2C architectures",
      "votesAgainst": 0,
      "votesFor": 3
    },
    {
      "abstentions": 1,
      "description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene inflammatio.",
      "number": 2,
      "passed": false,
      "title": "brand ubiquitous relationships",
      "votesAgainst": 1,
      "votesFor": 1
    },
    {
      "abstentions": 0,
      "description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne vicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca concedo ullus.",
      "number": 3,
      "passed": true,
      "title": "monetize intuitive networks",
      "votesAgainst": 0,
      "votesFor": 3
    }
  ],
  "secretary": {
    "email": "Jacky_Murray@hotmail.com",
    "name": "Terence Batz",
    "title": "Principal Factors Developer"
  },
  "signatures": [
    {
      "name": "Mrs. Tonya Doyle V",
      "role": "Chairman",
      "signedDate": "2025-05-07",
      "title": "Regional Identity Representative"
    },
    {
      "name": "Terence Batz",
      "role": "Secretary",
      "signedDate": "2025-05-07",
      "title": "Principal Factors Developer"
    }
  ],
  "startTime": "12:00",
  "templateVariant": "default"
}
Field Analysis
Matched
54
Mismatched
0
Missing
1
Accuracy
98.2%

Missing 1

  • ? absentees[0].title expected "Forward Solutions Executive"

Matched 54

  • ✓ meetingType
  • ✓ resolutions[1].number
  • ✓ secretary.title
  • ✓ resolutions[2].votesFor
  • ✓ resolutions[0].abstentions
  • ✓ signatures[0].role
  • ✓ signatures[1].name
  • ✓ agendaItems[0]
  • ✓ resolutions[2].votesAgainst
  • ✓ endTime
  • ✓ resolutions[0].votesAgainst
  • ✓ resolutions[2].title
  • ✓ location
  • ✓ attendees[2].name
  • ✓ attendees[2].title
  • ✓ meetingNumber
  • ✓ signatures[1].role
  • ✓ signatures[1].title
  • ✓ resolutions[1].votesFor
  • ✓ resolutions[1].passed
  • ✓ resolutions[2].passed
  • ✓ resolutions[2].number
  • ✓ attendees._length
  • ✓ resolutions[0].title
  • ✓ secretary.name
  • ✓ resolutions[1].votesAgainst
  • ✓ attendees[0].name
  • ✓ attendees[1].title
  • ✓ resolutions[0].description
  • ✓ signatures[0].name
  • ✓ resolutions[1].abstentions
  • ✓ chairman.name
  • ✓ chairman.title
  • ✓ agendaItems[2]
  • ✓ resolutions[0].votesFor
  • ✓ absentees[0].name
  • ✓ resolutions[2].description
  • ✓ attendees[1].name
  • ✓ signatures._length
  • ✓ resolutions[1].title
  • ✓ resolutions[1].description
  • ✓ agendaItems[1]
  • ✓ signatures[1].signedDate
  • ✓ attendees[0].title
  • ✓ resolutions[0].passed
  • ✓ absentees._length
  • ✓ signatures[0].title
  • ✓ startTime
  • ✓ signatures[0].signedDate
  • ✓ agendaItems._length
  • ✓ date
  • ✓ resolutions[0].number
  • ✓ resolutions[2].abstentions
  • ✓ resolutions._length
Extracted Text from PDF
MEETING PROTOCOL
Meeting Type: BOARD MEETING
Meeting Number: 2026-5
Date: 2025-05-07
Time: 12:00 - 13:00
Location: Bartoletti LLC Headquarters, Linden
Officers
Chairman: Mrs. Tonya Doyle V (Regional Identity Representative)
Secretary: Terence Batz (Principal Factors Developer)
Attendees
• Jessie Schuster - District Web Planner
• Mike Feil - Central Directives Planner
• Eva Funk - Internal Identity Executive
Absent
• Mr. Clark Davis
Agenda
1. brand proactive infrastructures
2. deploy world-class niches
3. expedite next-generation experiences
Resolutions
Resolution 1: monetize B2C architectures
Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio
viridis tepidus.
Votes: For: 3, Against: 0, Abstentions: 0
Result: PASSED
Resolution 2: brand ubiquitous relationships
Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene
inflammatio.
Votes: For: 1, Against: 1, Abstentions: 1
Result: NOT PASSED
Resolution 3: monetize intuitive networks
Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne
vicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca
concedo ullus.
Votes: For: 3, Against: 0, Abstentions: 0
Result: PASSED
Notes
Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana
tenax.

Certification
We hereby certify that these minutes are an accurate record of the proceedings.
_______________________________
Chairman: Mrs. Tonya Doyle V
Regional Identity Representative
Date: 2025-05-07
_______________________________
Secretary: Terence Batz
Principal Factors Developer
Date: 2025-05-07
System Prompt
You are a precise document data extraction expert. Your task is to extract structured data from protocol documents.

## Extraction Guidelines

Extract meeting protocol data including:
- Meeting type, number, date, start/end times, location
- Chairman and secretary (name, title, email)
- Attendees and absentees (arrays of objects with name, title, email)
- Agenda items (array of strings)
- Resolutions (number, title, description, votes, passed status)

## Important Rules

1. **Dates**: Always use ISO format (YYYY-MM-DD) for full dates, HH:MM for times
2. **Currency**: Use 3-letter ISO 4217 codes (EUR, USD, GBP, etc.)
3. **Missing optional fields**: Omit them entirely; don't use null or empty strings
4. **Required fields**: Make your best effort to extract; if truly not present, use a reasonable placeholder
5. **Numbers**: Extract as numeric values, not strings (except for identifiers like document numbers)
6. **Arrays**: Always return arrays even if only one item exists
7. **Text content**: Preserve important content accurately, but you may summarize very long passages
8. **Names**: Extract full names as they appear in the document

Respond with a JSON object containing the extracted data. Be precise and extract only what is explicitly stated in the document.
User Prompt
Please extract all structured data from this protocol document:

---
MEETING PROTOCOL
Meeting Type: BOARD MEETING
Meeting Number: 2026-5
Date: 2025-05-07
Time: 12:00 - 13:00
Location: Bartoletti LLC Headquarters, Linden
Officers
Chairman: Mrs. Tonya Doyle V (Regional Identity Representative)
Secretary: Terence Batz (Principal Factors Developer)
Attendees
• Jessie Schuster - District Web Planner
• Mike Feil - Central Directives Planner
• Eva Funk - Internal Identity Executive
Absent
• Mr. Clark Davis
Agenda
1. brand proactive infrastructures
2. deploy world-class niches
3. expedite next-generation experiences
Resolutions
Resolution 1: monetize B2C architectures
Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio
viridis tepidus.
Votes: For: 3, Against: 0, Abstentions: 0
Result: PASSED
Resolution 2: brand ubiquitous relationships
Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene
inflammatio.
Votes: For: 1, Against: 1, Abstentions: 1
Result: NOT PASSED
Resolution 3: monetize intuitive networks
Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne
vicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca
concedo ullus.
Votes: For: 3, Against: 0, Abstentions: 0
Result: PASSED
Notes
Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana
tenax.

Certification
We hereby certify that these minutes are an accurate record of the proceedings.
_______________________________
Chairman: Mrs. Tonya Doyle V
Regional Identity Representative
Date: 2025-05-07
_______________________________
Secretary: Terence Batz
Principal Factors Developer
Date: 2025-05-07
---

Extract the data as JSON according to the schema.
Raw LLM Response
{
  "meetingType": "board_meeting",
  "date": "2025-05-07",
  "chairman": {
    "name": "Mrs. Tonya Doyle V",
    "title": "Regional Identity Representative"
  },
  "absentees": [
    {
      "name": "Mr. Clark Davis"
    }
  ],
  "signatures": [
    {
      "role": "Chairman",
      "name": "Mrs. Tonya Doyle V",
      "signedDate": "2025-05-07",
      "title": "Regional Identity Representative"
    },
    {
      "role": "Secretary",
      "name": "Terence Batz",
      "signedDate": "2025-05-07",
      "title": "Principal Factors Developer"
    }
  ],
  "agendaItems": [
    "brand proactive infrastructures",
    "deploy world-class niches",
    "expedite next-generation experiences"
  ],
  "attendees": [
    {
      "name": "Jessie Schuster",
      "title": "District Web Planner"
    },
    {
      "name": "Mike Feil",
      "title": "Central Directives Planner"
    },
    {
      "name": "Eva Funk",
      "title": "Internal Identity Executive"
    }
  ],
  "endTime": "13:00",
  "location": "Bartoletti LLC Headquarters, Linden",
  "meetingNumber": "2026-5",
  "notes": "Demens tyrannus anser. Calculus thema demergo officiis careo decimus creptio sperno. Statim in cito campana tenax.",
  "resolutions": [
    {
      "number": "1",
      "title": "monetize B2C architectures",
      "passed": true,
      "votesFor": 3,
      "votesAgainst": 0,
      "abstentions": 0,
      "description": "Antea dolore commodo suggero stultus. Calculus textilis argentum cena conduco ancilla aperio. Cunae adficio\nviridis tepidus."
    },
    {
      "number": "2",
      "title": "brand ubiquitous relationships",
      "passed": false,
      "votesFor": 1,
      "votesAgainst": 1,
      "abstentions": 1,
      "description": "Ager consequatur aperio summopere cunae. Admiratio atavus enim vivo rem cognatus adsum. Correptius bene\ninflammatio."
    },
    {
      "number": "3",
      "title": "monetize intuitive networks",
      "passed": true,
      "votesFor": 3,
      "votesAgainst": 0,
      "abstentions": 0,
      "description": "Sophismata turba vel coaegresco tunc cado calco barba undique solum. Adeptio officiis verbera hic benigne\nvicissitudo agnosco cupio conscendo summa. Conculco concido patior volaticus accusamus delicate arca\nconcedo ullus."
    }
  ],
  "secretary": {
    "name": "Terence Batz",
    "title": "Principal Factors Developer"
  },
  "startTime": "12:00"
}
JSON Schema (Structured Output)

This schema is passed to the LLM via ResponseSchema to enforce structured JSON output.

{
  "example": {
    "absentees": [],
    "agendaItems": [
      "1. Approval of Previous Meeting Minutes",
      "2. Financial Report Q1 2024",
      "3. Strategic Planning Discussion"
    ],
    "attendees": [
      {
        "name": "Michael Johnson",
        "title": "Chief Financial Officer"
      },
      {
        "name": "Sarah Williams",
        "title": "Chief Operating Officer"
      }
    ],
    "chairman": {
      "name": "John Smith",
      "title": "Chairman of the Board"
    },
    "date": "2024-03-15",
    "endTime": "12:00",
    "location": "Corporate Headquarters, Conference Room A",
    "meetingNumber": "2024-001",
    "meetingType": "board_meeting",
    "notes": "Meeting adjourned at 12:00 PM. Next meeting scheduled for April 15, 2024.",
    "resolutions": [
      {
        "abstentions": 0,
        "description": "The board approves the proposed Q1 2024 budget of $2.5 million.",
        "number": "1",
        "passed": true,
        "title": "Approval of Q1 Budget",
        "votesAgainst": 0,
        "votesFor": 4
      }
    ],
    "secretary": {
      "name": "Jane Doe",
      "title": "Corporate Secretary"
    },
    "signatures": [
      {
        "name": "John Smith",
        "role": "Chairman",
        "signedDate": "2024-03-15",
        "title": "Chairman of the Board"
      },
      {
        "name": "Jane Doe",
        "role": "Secretary",
        "signedDate": "2024-03-15",
        "title": "Corporate Secretary"
      }
    ],
    "startTime": "10:00"
  },
  "properties": {
    "absentees": {
      "description": "List of people who were absent from the meeting. Use empty array [] if no absentees.",
      "items": {
        "properties": {
          "email": {
            "description": "Email address",
            "type": "STRING"
          },
          "name": {
            "description": "Full name of the person",
            "type": "STRING"
          },
          "title": {
            "description": "Job title or role",
            "type": "STRING"
          }
        },
        "required": [
          "name"
        ],
        "type": "OBJECT"
      },
      "type": "ARRAY"
    },
    "agendaItems": {
      "items": {
        "type": "STRING"
      },
      "type": "ARRAY"
    },
    "attendees": {
      "items": {
        "properties": {
          "email": {
            "description": "Email address",
            "type": "STRING"
          },
          "name": {
            "description": "Full name of the person",
            "type": "STRING"
          },
          "title": {
            "description": "Job title or role",
            "type": "STRING"
          }
        },
        "required": [
          "name"
        ],
        "type": "OBJECT"
      },
      "type": "ARRAY"
    },
    "chairman": {
      "properties": {
        "email": {
          "description": "Email address",
          "type": "STRING"
        },
        "name": {
          "description": "Full name of the person",
          "type": "STRING"
        },
        "title": {
          "description": "Job title or role",
          "type": "STRING"
        }
      },
      "required": [
        "name"
      ],
      "type": "OBJECT"
    },
    "date": {
      "description": "Meeting date in YYYY-MM-DD format",
      "type": "STRING"
    },
    "endTime": {
      "description": "End time in HH:MM format",
      "type": "STRING"
    },
    "location": {
      "description": "Meeting location",
      "type": "STRING"
    },
    "meetingNumber": {
      "description": "Meeting reference number",
      "type": "STRING"
    },
    "meetingType": {
      "description": "Type of meeting",
      "enum": [
        "board_meeting",
        "shareholder_meeting",
        "annual_general_meeting",
        "extraordinary_general_meeting"
      ],
      "type": "STRING"
    },
    "notes": {
      "type": "STRING"
    },
    "resolutions": {
      "items": {
        "properties": {
          "abstentions": {
            "description": "Number of abstentions. Use 0 if none.",
            "type": "INTEGER"
          },
          "description": {
            "type": "STRING"
          },
          "number": {
            "type": "STRING"
          },
          "passed": {
            "type": "BOOLEAN"
          },
          "title": {
            "type": "STRING"
          },
          "votesAgainst": {
            "description": "Number of votes against",
            "type": "INTEGER"
          },
          "votesFor": {
            "description": "Number of votes in favor",
            "type": "INTEGER"
          }
        },
        "required": [
          "number",
          "title",
          "passed",
          "votesFor",
          "votesAgainst",
          "abstentions"
        ],
        "type": "OBJECT"
      },
      "type": "ARRAY"
    },
    "secretary": {
      "properties": {
        "email": {
          "description": "Email address",
          "type": "STRING"
        },
        "name": {
          "description": "Full name of the person",
          "type": "STRING"
        },
        "title": {
          "description": "Job title or role",
          "type": "STRING"
        }
      },
      "required": [
        "name"
      ],
      "type": "OBJECT"
    },
    "signatures": {
      "description": "Signatures certifying the protocol accuracy. Typically signed by chairman and secretary.",
      "items": {
        "properties": {
          "name": {
            "description": "Full name of the person signing",
            "type": "STRING"
          },
          "role": {
            "description": "Role of the signatory (e.g., Chairman, Secretary)",
            "type": "STRING"
          },
          "signedDate": {
            "description": "Date the protocol was signed in YYYY-MM-DD format",
            "type": "STRING"
          },
          "title": {
            "description": "Job title of the signatory",
            "type": "STRING"
          }
        },
        "required": [
          "role",
          "name",
          "signedDate"
        ],
        "type": "OBJECT"
      },
      "type": "ARRAY"
    },
    "startTime": {
      "description": "Start time in HH:MM format",
      "type": "STRING"
    }
  },
  "required": [
    "meetingType",
    "date",
    "chairman",
    "absentees",
    "signatures"
  ],
  "type": "OBJECT"
}