DOJ-OGR-00024643.json 1.4 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455
  1. {
  2. "document_metadata": {
  3. "page_number": "005",
  4. "document_number": "NYMDK 530*C7",
  5. "date": "08-06-2019",
  6. "document_type": "ROSTER",
  7. "has_handwriting": false,
  8. "has_stamps": false
  9. },
  10. "full_text": "NYMDK 530*C7 * PAGE 005 ROSTER = 08-06-2019 02:40:42 Z04A Z04-206LAD 763-8-034 EPSTEIN JEFFREY 07-08-2019 A-PRE DOJ-OGR-00024643",
  11. "text_blocks": [
  12. {
  13. "type": "printed",
  14. "content": "NYMDK 530*C7 * PAGE 005",
  15. "position": "header"
  16. },
  17. {
  18. "type": "printed",
  19. "content": "ROSTER",
  20. "position": "header"
  21. },
  22. {
  23. "type": "printed",
  24. "content": "08-06-2019 02:40:42",
  25. "position": "header"
  26. },
  27. {
  28. "type": "printed",
  29. "content": "Z04A Z04-206LAD 763-8-034 EPSTEIN JEFFREY 07-08-2019 A-PRE",
  30. "position": "middle"
  31. },
  32. {
  33. "type": "printed",
  34. "content": "DOJ-OGR-00024643",
  35. "position": "footer"
  36. }
  37. ],
  38. "entities": {
  39. "people": [
  40. "JEFFREY EPSTEIN"
  41. ],
  42. "organizations": [],
  43. "locations": [],
  44. "dates": [
  45. "08-06-2019",
  46. "07-08-2019"
  47. ],
  48. "reference_numbers": [
  49. "NYMDK 530*C7",
  50. "Z04A Z04-206LAD 763-8-034",
  51. "DOJ-OGR-00024643"
  52. ]
  53. },
  54. "additional_notes": "The majority of the document is obscured by a green rectangle, making most of the content unreadable. The visible text is extracted from the header, footer, and a single line in the middle."
  55. }