1539 lines
55 KiB
JSON
1539 lines
55 KiB
JSON
{
|
|
"meta": {
|
|
"model": "mistral",
|
|
"passes": 3,
|
|
"sample_size": 50,
|
|
"started": "2026-04-28T01:39:19.750205",
|
|
"completed": "2026-04-28T01:56:58.176009"
|
|
},
|
|
"documents": [
|
|
{
|
|
"id": "claude_bbe0172d-3087-4238-a51c-7dca6c0b6f28_1326",
|
|
"source": "Claude: Setting up a custom OpenClaw instance",
|
|
"content_hash": "0ff1319e",
|
|
"content_length": 700,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
13.6,
|
|
2.6,
|
|
2.5
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [
|
|
"30 days"
|
|
],
|
|
"document_type": "conversation"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"30 days\"],\n \"document_type\": \"conversation\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"30 days\"],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"30 days\"],\n \"document_type\": \"conversation\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "1a545c4e_432",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "5d6d9cf1",
|
|
"content_length": 2807,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
18.1,
|
|
3.6,
|
|
5.2
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"bloom",
|
|
"corny kelleher",
|
|
"first watch",
|
|
"second watch"
|
|
],
|
|
"organizations": [
|
|
"behan's",
|
|
"jammet's"
|
|
],
|
|
"locations": [
|
|
"gardiner street",
|
|
"nighttown",
|
|
"scaffolding"
|
|
],
|
|
"dates": [],
|
|
"document_type": "literature"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Bloom\", \"First Watch\", \"Second Watch\", \"Corny Kelleher\"],\n \"organizations\": [\"Jammet's\", \"Behan's\"],\n \"locations\": [\"Nighttown\", \"Gardiner street\", \"scaffolding\"],\n \"document_type\":",
|
|
"{\n \"people\": [\"BLOOM\", \"CORNY KELLEHER\", \"Father\"],\n \"locations\": [\"nighttown\", \"Gardiner street\"],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Bloom\", \"Corny Kelleher\", \"First Watch\", \"Second Watch\", \"Father\"],\n \"organizations\": [],\n \"locations\": [\"Gardiner street\", \"nighttown\", \"Jammet's\"],\n \"dates\": [],\n \"document_type\""
|
|
]
|
|
},
|
|
{
|
|
"id": "claude_bbe0172d-3087-4238-a51c-7dca6c0b6f28_430",
|
|
"source": "Claude: Setting up a custom OpenClaw instance",
|
|
"content_hash": "37dc9e1c",
|
|
"content_length": 2937,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
19.0,
|
|
2.2,
|
|
2.2
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"aaronnelson.studio",
|
|
"nextcloud"
|
|
],
|
|
"locations": [
|
|
"nextcloud.aaronnelson.studio"
|
|
],
|
|
"dates": [],
|
|
"document_type": "text"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [\"Nextcloud\", \"aaronnelson.studio\"],\n \"locations\": [\"nextcloud.aaronnelson.studio\"],\n \"dates\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"locations\": [\"nextcloud.aaronnelson.studio\"],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"locations\": [\"nextcloud.aaronnelson.studio\"],\n \"document_type\": \"plain text\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "0e18a972_12",
|
|
"source": "RH50-TM-L1-EN-20140902.pdf",
|
|
"content_hash": "dd1e2907",
|
|
"content_length": 2709,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.8,
|
|
2.7,
|
|
3.2
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"robert mcneel"
|
|
],
|
|
"organizations": [
|
|
"robert mcneel & associates"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": ""
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Robert McNeel\"],\n \"organizations\": [\"Robert McNeel & Associates\"]\n}",
|
|
"{\n \"people\": [\"Robert McNeel\"],\n \"organizations\": [\"Robert McNeel & Associates\"],\n \"document_type\": \"instructions\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Robert McNeel & Associates\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Instruction manual\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "1a545c4e_197",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "d911e3fd",
|
|
"content_length": 2741,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
16.4,
|
|
5.9,
|
|
5.8
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"girlgold",
|
|
"hugh machugh",
|
|
"kennedy",
|
|
"lenehan",
|
|
"miss douce",
|
|
"mr dedalus",
|
|
"stephen"
|
|
],
|
|
"organizations": [
|
|
"mooney's en ville",
|
|
"mooney's sur mer"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "fiction"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Kennedy\", \"girlgold\", \"Miss Douce\", \"Stephen\", \"Lenehan\", \"Mr Dedalus\", \"Hugh MacHugh\"],\n \"organizations\": [\"Mooney's EN VILLE\", \"Mooney's SUR MER\"],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Kennedy\", \"Miss Douce\", \"Lenehan\", \"Stephen\", \"Mr Dedalus\", \"Hugh MacHugh\"],\n \"organizations\": [\"Mooney's EN VILLE\", \"Mooney's SUR MER\"],\n \"locations\": [],\n \"dates\": [],\n \"document",
|
|
"{\n \"people\": [\"Kennedy\", \"Mr Dedalus\", \"Lenehan\", \"Stephen\", \"Hugh MacHugh\"],\n \"organizations\": [],\n \"locations\": [\"Mooney's EN VILLE\", \"Mooney's SUR MER\"],\n \"dates\": [],\n \"document_type\": \"ficti"
|
|
]
|
|
},
|
|
{
|
|
"id": "88602096_2",
|
|
"source": "Kingston Grads Ind Study SP2023 Syllabus.pdf",
|
|
"content_hash": "43b2ec27",
|
|
"content_length": 2525,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
15.7,
|
|
7.2,
|
|
7.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"members",
|
|
"students"
|
|
],
|
|
"organizations": [
|
|
"dean of your school",
|
|
"department chair",
|
|
"office of human resources, diversity & inclusion (hrdi)",
|
|
"suny new paltz",
|
|
"title ix office"
|
|
],
|
|
"locations": [
|
|
"campus buildings",
|
|
"new paltz",
|
|
"student union, room 100 south"
|
|
],
|
|
"dates": [],
|
|
"document_type": "policy statement"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"members\", \"students\"],\n \"organizations\": [\"SUNY New Paltz\", \"Title IX Office\", \"department chair\", \"dean of your school\", \"Office of Human Resources, Diversity & Inclusion (HRDI)\"],\n ",
|
|
"{\n \"people\": [\"members\", \"students\"],\n \"organizations\": [\"SUNY New Paltz\", \"Title IX Office\", \"department chair and/or the dean of your school\", \"Office of Human Resources, Diversity & Inclusion (HR",
|
|
"{\n \"people\": [\"members\", \"students\"],\n \"organizations\": [\"SUNY New Paltz\", \"Title IX Office\", \"department chair\", \"dean of your school\", \"Office of Human Resources, Diversity & Inclusion (HRDI)\"],\n "
|
|
]
|
|
},
|
|
{
|
|
"id": "7785818c_1",
|
|
"source": "The Extended Mind _ The Power of Thinking Outside the Brain -- Annie Murphy Paul.pdf",
|
|
"content_hash": "48faec1d",
|
|
"content_length": 2891,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
12.5,
|
|
3.4,
|
|
3.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"fr\u00e9d\u00e9ric gros",
|
|
"nietzsche"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Nietzsche\", \"Fr\u00e9d\u00e9ric Gros\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Nietzsche\", \"Fr\u00e9d\u00e9ric Gros\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Nietzsche\", \"Fr\u00e9d\u00e9ric Gros\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "1a545c4e_3",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "73ad0e8d",
|
|
"content_length": 2733,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
13.8,
|
|
3.8,
|
|
3.7
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"buck mulligan",
|
|
"stephen",
|
|
"ursula"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"irish art",
|
|
"island"
|
|
],
|
|
"dates": [],
|
|
"document_type": "fiction"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Stephen\", \"Buck Mulligan\", \"Ursula\"],\n \"organizations\": [],\n \"locations\": [\"Irish art\", \"Island\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Stephen\", \"Buck Mulligan\", \"Ursula\"],\n \"organizations\": [],\n \"locations\": [\"Irish art\", \"the island\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Stephen\", \"Buck Mulligan\", \"Ursula\"],\n \"organizations\": [],\n \"locations\": [\"Irish island\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "1a545c4e_46",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "f42b21d0",
|
|
"content_length": 2833,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
15.3,
|
|
3.5,
|
|
3.4
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"eleven",
|
|
"she"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"dolphin's barn"
|
|
],
|
|
"dates": [],
|
|
"document_type": "book title (assumed from 'ruby: the pride of the ring')"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Eleven\", \"She\"],\n \"organizations\": [],\n \"locations\": [\"Dolphin's Barn\"],\n \"dates\": [],\n \"document_type\": \"Book Title (assumed from 'RUBY: THE PRIDE OF THE RING')\"\n}",
|
|
"{\n \"people\": [\"Eleven\", \"She\"],\n \"organizations\": [],\n \"locations\": [\"Dolphin's Barn\"],\n \"dates\": [],\n \"document_type\": \"Book\"\n}",
|
|
"{\n \"people\": [\"Eleven\", \"She\"],\n \"organizations\": [],\n \"locations\": [\"Dolphin's Barn\"],\n \"dates\": [],\n \"document_type\": \"book\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "9d366a6a_2",
|
|
"source": "Circuit Intro.pptx",
|
|
"content_hash": "5467e94e",
|
|
"content_length": 2946,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
11.7,
|
|
2.4,
|
|
2.5
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "text"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "49e3545d_33",
|
|
"source": "RH50-TM-L1-EN-20140902.pdf",
|
|
"content_hash": "6e608b0e",
|
|
"content_length": 2928,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
12.0,
|
|
3.2,
|
|
3.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"robert mcneel & associates"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "model"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [\"Robert McNeel & Associates\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"model\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Robert McNeel & Associates\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Cplanes.3dm\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Robert McNeel & Associates\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Cplanes.3dm\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "fc378df0_203",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "eb17907a",
|
|
"content_length": 2945,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
14.6,
|
|
4.7,
|
|
4.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"ben dollard",
|
|
"george lidwell",
|
|
"lydia douce"
|
|
],
|
|
"organizations": [
|
|
"the independent"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "fiction"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Ben Dollard\", \"Lydia Douce\", \"George Lidwell\"],\n \"organizations\": [\"The INDEPENDENT\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Fiction\"\n}",
|
|
"{\n \"people\": [\"Bloom\", \"Molly\", \"Ben Dollard\", \"Miss Douce\", \"Lydia Douce\", \"George Lidwell\"],\n \"organizations\": [\"INDEPENDENT\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Bloom\", \"Molly\", \"Ben Dollard\", \"Miss Douce\", \"Lydia Douce\", \"George Lidwell\"],\n \"organizations\": [\"INDEPENDENT\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"newspaper arti"
|
|
]
|
|
},
|
|
{
|
|
"id": "1a545c4e_12",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "2d5907e9",
|
|
"content_length": 2800,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
13.3,
|
|
3.5,
|
|
4.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"buck mulligan",
|
|
"haines",
|
|
"stephen"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"bay",
|
|
"elsinore",
|
|
"sea"
|
|
],
|
|
"dates": [],
|
|
"document_type": "literature"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Stephen\", \"Haines\", \"Buck Mulligan\"],\n \"locations\": [\"Elsinore\", \"sea\", \"bay\"],\n \"document_type\": \"literature\"\n}",
|
|
"{\n \"people\": [\"Stephen\", \"Haines\", \"Buck Mulligan\"],\n \"organizations\": [],\n \"locations\": [\"Elsinore\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Stephen\", \"Haines\", \"Buck Mulligan\"],\n \"organizations\": [],\n \"locations\": [\"Elsinore\", \"Sea\", \"Bay\", \"Muglins\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "e6101efc_1",
|
|
"source": "3D Printing \u2013 Designing for Additive2.pptx",
|
|
"content_hash": "7bb3f96b",
|
|
"content_length": 639,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
11.1,
|
|
2.9,
|
|
2.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"hvamc"
|
|
],
|
|
"locations": [],
|
|
"dates": [
|
|
"2017"
|
|
],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"document_type\": \"article\",\n \"locations\": [],\n \"people\": [],\n \"organizations\": [\"HVAMC\"],\n \"dates\": [\"2017\"]\n}",
|
|
"{\n \"document_type\": \"article\",\n \"organizations\": [\"HVAMC\"],\n \"locations\": [],\n \"dates\": [\"2017\"],\n \"people\": []\n}",
|
|
"{\n \"organizations\": [\"HVAMC\"],\n \"dates\": [\"2017\"],\n \"document_type\": \"article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "fc378df0_79",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "f9333d86",
|
|
"content_length": 2691,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
14.3,
|
|
4.5,
|
|
3.5
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"dedalus",
|
|
"father coffey"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"saint werburgh's"
|
|
],
|
|
"dates": [],
|
|
"document_type": "novel"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Father Coffey\", \"Dedalus\"],\n \"organizations\": [],\n \"locations\": [\"Saint Werburgh's\"],\n \"dates\": [],\n \"document_type\": \"novel\"\n}",
|
|
"{\n \"people\": [\"Father Coffey\", \"Dedalus\", \"Molly\", \"Mervyn Browne\"],\n \"organizations\": [],\n \"locations\": [\"Saint Werburgh's\"],\n \"dates\": [],\n \"document_type\": \"novel\"\n}",
|
|
"{\n \"people\": [\"Father Coffey\", \"Dedalus\"],\n \"organizations\": [],\n \"locations\": [\"Saint Werburgh's\"],\n \"dates\": [],\n \"document_type\": \"novel\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "25df23c5_0",
|
|
"source": "MIC Work Instructions.docx",
|
|
"content_hash": "542035c0",
|
|
"content_length": 2192,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.3,
|
|
2.9,
|
|
3.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"users"
|
|
],
|
|
"organizations": [
|
|
"mic",
|
|
"newpaltz"
|
|
],
|
|
"locations": [
|
|
"print center"
|
|
],
|
|
"dates": [],
|
|
"document_type": "email"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"users\"],\n \"organizations\": [\"Newpaltz\", \"MIC\"],\n \"locations\": [\"print center\"],\n \"document_type\": \"email\"\n}",
|
|
"{\n \"people\": [\"users\"],\n \"organizations\": [\"Newpaltz.edu\", \"MIC\"],\n \"locations\": [\"print center\"],\n \"document_type\": \"email\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Newpaltz\", \"MIC\"],\n \"locations\": [\"print center\"],\n \"dates\": [],\n \"document_type\": \"email\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "7369fb88_0",
|
|
"source": "Selected FDM Materials - EN Chemical Compatibility (2).pdf",
|
|
"content_hash": "9577291b",
|
|
"content_length": 2976,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
13.5,
|
|
3.0,
|
|
2.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"stratasys"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "data sheet"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [\"Stratasys\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Data Sheet\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Stratasys\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Data Sheet\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Stratasys\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Data Sheet\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "a230f2c3_593",
|
|
"source": "Landscape And Memory -- Simon Schama.pdf",
|
|
"content_hash": "b9bb7299",
|
|
"content_length": 1373,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
23.8,
|
|
7.0,
|
|
6.1
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"carlo ginzburg",
|
|
"john hutchin",
|
|
"leo wieseltier"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"greenwood"
|
|
],
|
|
"dates": [
|
|
"1774",
|
|
"1808",
|
|
"1990",
|
|
"aug. 5, 1991"
|
|
],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Carlo Ginzburg\", \"John Hutchin\", \"Leo Wieseltier\"],\n \"organizations\": [],\n \"locations\": [\"Greenwood\"],\n \"dates\": [\"1990\", \"Aug. 5, 1991\", \"1774\", \"1808\"],\n \"document_type\": \"articl",
|
|
"{\n \"people\": [\"Cambell\", \"American Scholar\", \"Carlo Ginzburg\", \"Leo Weiseltier\"],\n \"organizations\": [],\n \"locations\": [\"Greenwood\"],\n \"dates\": [\"1990\", \"Aug. 5, 1991\", \"1774\", \"1808\"],\n \"document",
|
|
"{\n \"people\": [\"Carlo Ginzburg\", \"John Hutchin\", \"Leon Weiseltier\"],\n \"organizations\": [],\n \"locations\": [\"Greenwood\", \"Dorset\", \"London\"],\n \"dates\": [\"1990\", \"1774\", \"1808\"],\n \"document_type\": \"a"
|
|
]
|
|
},
|
|
{
|
|
"id": "91ccefdd_35",
|
|
"source": "Cognition in the Wild (A Bradford Book) -- Hutchins, Edwin.pdf",
|
|
"content_hash": "02c3beb2",
|
|
"content_length": 2722,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.5,
|
|
3.0,
|
|
3.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [
|
|
"region around the ship",
|
|
"shore"
|
|
],
|
|
"dates": [],
|
|
"document_type": "book"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [\"region around the ship\", \"shore\"],\n \"dates\": [],\n \"document_type\": \"book\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [\"region around the ship\", \"ship\"],\n \"dates\": [],\n \"document_type\": \"book\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [\"region around the ship\", \"shore\"],\n \"dates\": [],\n \"document_type\": \"book\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "a230f2c3_310",
|
|
"source": "Landscape And Memory -- Simon Schama.pdf",
|
|
"content_hash": "310615d5",
|
|
"content_length": 2808,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
14.6,
|
|
4.8,
|
|
4.8
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"keymis",
|
|
"ralegh"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"england",
|
|
"greenwich",
|
|
"newfoundland",
|
|
"plymouth",
|
|
"thames estuary",
|
|
"westminster"
|
|
],
|
|
"dates": [
|
|
"29"
|
|
],
|
|
"document_type": "letter"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Ralegh\", \"Keymis\"],\n \"organizations\": [],\n \"locations\": [\"Greenwich\", \"Westminster\", \"Plymouth\", \"Thames Estuary\", \"England\", \"Newfoundland\"],\n \"dates\": [\"29\"],\n \"document_type\": \"",
|
|
"{\n \"people\": [\"Ralegh\", \"Keymis\", \"Queen\"],\n \"locations\": [\"Keymis\", \"cabin\", \"Newfoundland\", \"Plymouth\", \"Thames estuary\", \"France\", \"Greenwich\", \"Westminster\"],\n \"document_type\": \"letter\"\n}",
|
|
"{\n \"people\": [\"Sir Walter Ralegh\", \"Keymis\"],\n \"locations\": [\"miserable Keymis\", \"cabin\", \"Newfoundland\", \"Plymouth\", \"Thames estuary\", \"Greenwich\", \"Westminster\"],\n \"document_type\": \"historical do"
|
|
]
|
|
},
|
|
{
|
|
"id": "claude_bbe0172d-3087-4238-a51c-7dca6c0b6f28_280",
|
|
"source": "Claude: Setting up a custom OpenClaw instance",
|
|
"content_hash": "995c8e57",
|
|
"content_length": 1454,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
15.6,
|
|
3.0,
|
|
3.5
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"aaron"
|
|
],
|
|
"organizations": [
|
|
"aaronnelson.studio"
|
|
],
|
|
"locations": [],
|
|
"dates": [
|
|
"thu, 23 apr 2026"
|
|
],
|
|
"document_type": "text"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"aaron\"],\n \"organizations\": [\"aaronnelson.studio\"],\n \"dates\": [\"Thu, 23 Apr 2026\"],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [\"aaronnelson\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [\"aaron\"],\n \"organizations\": [\"aaronnelson.studio\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "91ccefdd_125",
|
|
"source": "Cognition in the Wild (A Bradford Book) -- Hutchins, Edwin.pdf",
|
|
"content_hash": "8a85596b",
|
|
"content_length": 2893,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
10.9,
|
|
2.8,
|
|
2.6
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "text"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"manual\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"instruction\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "074bb5f9_85",
|
|
"source": "Mystery train _ images of America in rock 'n' roll music -- Marcus, Greil.pdf",
|
|
"content_hash": "ac830289",
|
|
"content_length": 2702,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
13.1,
|
|
3.8,
|
|
4.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"staggerlee",
|
|
"superflake",
|
|
"taxi man"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"harlem"
|
|
],
|
|
"dates": [],
|
|
"document_type": "movie_review"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Superflake\", \"Taxi Man\", \"Staggerlee\"],\n \"organizations\": [],\n \"locations\": [\"Harlem\"],\n \"dates\": [],\n \"document_type\": \"movie_review\"\n}",
|
|
"{\n \"people\": [\"Taxi Man\", \"Staggerlee\", \"Superflake\", \"Franciosa\"],\n \"organizations\": [],\n \"locations\": [\"Harlem\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Superflake\", \"Taxi Man\", \"Staggerlee\", \"Fats Domino\"],\n \"organizations\": [],\n \"locations\": [\"Harlem\"],\n \"dates\": [],\n \"document_type\": \"movie script\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "9cf798f8_74",
|
|
"source": "Shop Class as Soulcraft An inquiry into the value of the -- Crawford, Matthew.pdf",
|
|
"content_hash": "22d20263",
|
|
"content_length": 2704,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.6,
|
|
2.4,
|
|
2.5
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"locations\": [],\n \"people\": [],\n \"organizations\": [],\n \"dates\": [],\n \"document_type\": \"story\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "a230f2c3_84",
|
|
"source": "Landscape And Memory -- Simon Schama.pdf",
|
|
"content_hash": "39832bd0",
|
|
"content_length": 2725,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.6,
|
|
1.7,
|
|
1.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [
|
|
"germania"
|
|
],
|
|
"dates": [],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"locations\": [\"Germania\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"locations\": [\"Germania\"],\n \"document_type\": \"Historical Text\"\n}",
|
|
"{\n \"locations\": [\"Germania\", \"Latinized Gaul\"],\n \"document_type\": \"article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "91ccefdd_282",
|
|
"source": "Cognition in the Wild (A Bradford Book) -- Hutchins, Edwin.pdf",
|
|
"content_hash": "a27a5292",
|
|
"content_length": 2868,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
10.3,
|
|
2.6,
|
|
2.6
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"quartermaster chief"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"quartermaster chief\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"quartermaster chief\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"quartermaster chief\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "fc378df0_53",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "62d1a05e",
|
|
"content_length": 2797,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
14.7,
|
|
5.3,
|
|
4.1
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"griffith",
|
|
"henry flower",
|
|
"maud gonne"
|
|
],
|
|
"organizations": [
|
|
"p. o.",
|
|
"royal dublin fusiliers"
|
|
],
|
|
"locations": [
|
|
"city",
|
|
"westland row"
|
|
],
|
|
"dates": [],
|
|
"document_type": "letter"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Henry Flower\", \"Maud Gonne\", \"Griffith\"],\n \"organizations\": [\"P. O.\", \"Royal Dublin fusiliers\"],\n \"locations\": [\"Westland Row\", \"City\"],\n \"document_type\": \"letter\"\n}",
|
|
"{\n \"people\": [\"Henry Flower\", \"Maud Gonne\", \"old Tweedy\"],\n \"organizations\": [\"P.O.\", \"Royal Dublin fusiliers\", \"King's own\"],\n \"locations\": [\"Westland Row\", \"City\", \"O'Connell street\"],\n \"documen",
|
|
"{\n \"people\": [\"Henry Flower\", \"Maud Gonne\", \"Griffith\"],\n \"organizations\": [],\n \"locations\": [\"City\", \"Westland Row\"],\n \"dates\": [],\n \"document_type\": \"letter\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "074bb5f9_27",
|
|
"source": "Mystery train _ images of America in rock 'n' roll music -- Marcus, Greil.pdf",
|
|
"content_hash": "075f007a",
|
|
"content_length": 2752,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
13.2,
|
|
4.1,
|
|
4.2
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"michael jackson",
|
|
"mick jagger",
|
|
"muddy waters",
|
|
"robert johnson"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [
|
|
"thirties",
|
|
"two hundred years ago"
|
|
],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Robert Johnson\", \"Muddy Waters\", \"Mick Jagger\", \"Michael Jackson\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"two hundred years ago\", \"thirties\"],\n \"document_type\": \"arti",
|
|
"{\n \"people\": [\"Robert Johnson\", \"Muddy Waters\", \"Mick Jagger\", \"Michael Jackson\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"two hundred years ago\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"man\", \"Robert Johnson\", \"Son House\", \"Skip James\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"more than two hundred years ago\", \"the thirties\"],\n \"document_type\": \"articl"
|
|
]
|
|
},
|
|
{
|
|
"id": "7ec60c0a_2",
|
|
"source": "Slide Slam 2022 Bios.docx",
|
|
"content_hash": "20fbe52c",
|
|
"content_length": 1435,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.5,
|
|
3.0,
|
|
3.1
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"alex",
|
|
"briana rascoe"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Alex\", \"Briana Rascoe\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Alex\", \"Briana Rascoe\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Alex\", \"Briana Rascoe\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"news article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "fec527fe_1",
|
|
"source": "Lecture 2 Update.pptx",
|
|
"content_hash": "cb8c74a3",
|
|
"content_length": 2704,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
17.8,
|
|
3.2,
|
|
2.7
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [
|
|
"(300, 300)",
|
|
"(640, 384)"
|
|
],
|
|
"dates": [],
|
|
"document_type": "text"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"locations\": [\"(300, 300)\", \"(640, 384)\"],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"locations\": [\"(300, 300)\", \"(640, 384)\"],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"locations\": [\"(300, 300)\", \"(640, 384)\"],\n \"document_type\": \"text\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "1a545c4e_389",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "2aeec086",
|
|
"content_length": 2874,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
19.9,
|
|
4.2,
|
|
4.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"best",
|
|
"he",
|
|
"john eglinton",
|
|
"mananaun maclir"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "fiction"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"He\", \"Best\", \"John Eglinton\", \"Mananaun MacLir\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Beer\", \"Bishop\", \"He is our friend\", \"Mananan MacLir\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"He\", \"BEST\", \"John Eglinton\", \"Mananau MacLir\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"literature\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "76c315b5_1",
|
|
"source": "CAD I Syllabus-SP19_Revised.docx",
|
|
"content_hash": "71d1c925",
|
|
"content_length": 2983,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
14.7,
|
|
6.6,
|
|
9.5
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"new paltz",
|
|
"sojourner truth library"
|
|
],
|
|
"locations": [
|
|
"http://lib.newpaltz.edu/assistance/plag.html",
|
|
"https://www.newpaltz.edu/emergency/policy.html"
|
|
],
|
|
"dates": [
|
|
"april 2nd"
|
|
],
|
|
"document_type": "academic policy document"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [\"New Paltz\", \"Sojourner Truth Library\"],\n \"locations\": [\"https://www.newpaltz.edu/emergency/policy.html\", \"http://lib.newpaltz.edu/assistance/plag.html\"],\n \"dat",
|
|
"{\n \"people\": [],\n \"organizations\": [\"New Paltz\", \"Sojourner Truth Library\"],\n \"locations\": [\"https://www.newpaltz.edu/emergency/policy.html\", \"http://lib.newpaltz.edu/assistance/plag.html\"],\n \"dat",
|
|
"Services Office at New Paltz as soon as possible. The office can be reached at 845-257-3106 or via email at [disability@newpaltz.edu](mailto:disability@newpaltz.edu). Accommodations must be approved i"
|
|
]
|
|
},
|
|
{
|
|
"id": "074bb5f9_442",
|
|
"source": "Mystery train _ images of America in rock 'n' roll music -- Marcus, Greil.pdf",
|
|
"content_hash": "197e4a86",
|
|
"content_length": 1303,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
17.9,
|
|
7.9,
|
|
6.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"bruce springsteen",
|
|
"elvis presley",
|
|
"greil marcus",
|
|
"lyle lovett",
|
|
"patty loveless",
|
|
"randy newman"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [
|
|
"16",
|
|
"20",
|
|
"232",
|
|
"3",
|
|
"307"
|
|
],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Elvis Presley\", \"Patty Loveless\", \"Randy Newman\", \"Lyle Lovett\", \"Greil Marcus\", \"Bruce Springsteen\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"16\", \"232\", \"307\", \"3\", \"2",
|
|
"{\n \"people\": [\"Elvis Presley\", \"Patty Loveless\", \"Randy Newman\", \"Lyle Lovett\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"20 years before the 1975\", \"16\", \"232\", \"307\", \"3 11\", \"34\"],\n ",
|
|
"{\n \"people\": [\"Elvis Presley\", \"Patty Loveless\", \"Randy Newman\", \"Lyle Lovett\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"16\", \"337\", \"232\", \"307\", \"3\", \"20 years before\", \"1975\"],\n \"d"
|
|
]
|
|
},
|
|
{
|
|
"id": "a230f2c3_599",
|
|
"source": "Landscape And Memory -- Simon Schama.pdf",
|
|
"content_hash": "4cf471ff",
|
|
"content_length": 2271,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
24.8,
|
|
8.3,
|
|
8.4
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"alexander hunter",
|
|
"batty langley",
|
|
"charnock",
|
|
"e. p. thompson",
|
|
"roger fisher",
|
|
"sir henry wood"
|
|
],
|
|
"organizations": [
|
|
"house of commons committee of inquiry",
|
|
"royal society of arts"
|
|
],
|
|
"locations": [
|
|
"london"
|
|
],
|
|
"dates": [
|
|
"1728",
|
|
"1771",
|
|
"1772",
|
|
"1789",
|
|
"1800-2",
|
|
"1912",
|
|
"1975"
|
|
],
|
|
"document_type": "book"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Charnock\", \"Batty Langley\", \"E. P. Thompson\", \"Roger Fisher\", \"Sir Henry Wood\", \"Alexander Hunter\"],\n \"organizations\": [\"House of Commons committee of inquiry\", \"Royal Society of Arts",
|
|
"{\n \"people\": [\"Charnock\", \"Batty Langley\", \"E. P. Thompson\", \"Roger Fisher\", \"Sir Henry Wood\", \"Alexander Hunter\"],\n \"organizations\": [\"House of Commons committee of inquiry\", \"Royal Society of Arts",
|
|
"{\n \"people\": [\"Charnock\", \"Batty Langley\", \"E. P. Thompson\", \"Roger Fisher\", \"Sir Henry Wood\", \"Alexander Hunter\"],\n \"organizations\": [\"The Royal Society of Arts\", \"House of Commons committee of inq"
|
|
]
|
|
},
|
|
{
|
|
"id": "074bb5f9_90",
|
|
"source": "Mystery train _ images of America in rock 'n' roll music -- Marcus, Greil.pdf",
|
|
"content_hash": "7e625551",
|
|
"content_length": 2748,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
14.0,
|
|
2.8,
|
|
2.8
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"richard avedon",
|
|
"rosie stone",
|
|
"sly"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [
|
|
"1973"
|
|
],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Sly\", \"Richard Avedon\", \"Rosie Stone\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"1973\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Sly\", \"Richard Avedon\", \"Rosie Stone\"],\n \"dates\": [\"1973\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Sly\", \"Richard Avedon\", \"Rosie Stone\"],\n \"dates\": [\"1973\"],\n \"document_type\": \"article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "fc378df0_355",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "5a4d6725",
|
|
"content_length": 2883,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
20.4,
|
|
4.4,
|
|
4.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"bloom",
|
|
"bridie kelly",
|
|
"mrs marion",
|
|
"sweny"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"east",
|
|
"south"
|
|
],
|
|
"dates": [],
|
|
"document_type": "literature"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Mrs Marion\", \"Bloom\", \"Sweny\", \"Bridie Kelly\"],\n \"organizations\": [],\n \"locations\": [\"South\", \"East\"],\n \"dates\": [],\n \"document_type\": \"literature\"\n}",
|
|
"{\n \"people\": [\"Mrs Marion\", \"Bloom\", \"Sweny\", \"Marion\"],\n \"organizations\": [],\n \"locations\": [\"South\", \"East\", \"Hatch street\"],\n \"dates\": [],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"Mrs Marion\", \"Bloom\", \"Marion\", \"Sweny\", \"Bawd\", \"Bridie Kelly\"],\n \"organizations\": [],\n \"locations\": [\"South\", \"East\"],\n \"dates\": [],\n \"document_type\": \"Fiction\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "211f2199_71",
|
|
"source": "The E-myth revisited _ why most small businesses don't work -- Michael E_ Gerber.pdf",
|
|
"content_hash": "11665e8e",
|
|
"content_length": 2809,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.3,
|
|
2.6,
|
|
2.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"sarah"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "letter"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Sarah\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"letter\"\n}",
|
|
"{\n \"people\": [\"Sarah\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"business\"\n}",
|
|
"{\n \"people\": [\"Sarah\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "3ab67806_0",
|
|
"source": "CMakeLists.txt",
|
|
"content_hash": "15a52de3",
|
|
"content_length": 1020,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
7.9,
|
|
0.9,
|
|
0.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "cmake script"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"document_type\": \"cmake script\"\n}",
|
|
"{\n \"document_type\": \"cmake script\"\n}",
|
|
"{\n \"document_type\": \"cmake\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "eab75ec0_0",
|
|
"source": "CMakeLists.txt",
|
|
"content_hash": "d3d4f035",
|
|
"content_length": 1881,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
13.9,
|
|
1.0,
|
|
1.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "cmake file"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"document_type\": \"CMake file\"\n}",
|
|
"{\n \"document_type\": \"CMake file\"\n}",
|
|
"{\n \"document_type\": \"CMake file\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "293288df_31",
|
|
"source": "RhinoPythonPrimerRev3.pdf",
|
|
"content_hash": "6400418d",
|
|
"content_length": 2742,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.2,
|
|
0.9,
|
|
2.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [
|
|
"(0,0,0)"
|
|
],
|
|
"dates": [],
|
|
"document_type": "code"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"document_type\": \"code\",\n \"locations\": [\"(0,0,0)\"]\n}",
|
|
"{\n \"document_type\": \"code\"\n}",
|
|
"{\n \"document_type\": \"code\",\n \"locations\": [\"(0,0,0)\"]\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "f6a8d07a_18",
|
|
"source": "Arduino Microcontroller Basics.pdf",
|
|
"content_hash": "b4c3f332",
|
|
"content_length": 2669,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.3,
|
|
2.6,
|
|
2.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "arduino code"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Arduino Code\"\n}",
|
|
"{\n \"locations\": [],\n \"organizations\": [\"Arduino\"],\n \"people\": [],\n \"dates\": [],\n \"document_type\": \"program\"\n}",
|
|
"{\n \"document_type\": \"programming code\",\n \"locations\": [],\n \"people\": [],\n \"organizations\": [],\n \"dates\": []\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "05b9d711_116",
|
|
"source": "Company of One -- Paul Jarvis.pdf",
|
|
"content_hash": "6e7a4314",
|
|
"content_length": 2945,
|
|
"status": "CONSISTENT",
|
|
"consistent": true,
|
|
"pass_times_seconds": [
|
|
12.3,
|
|
3.1,
|
|
2.6
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"derek"
|
|
],
|
|
"organizations": [
|
|
"cdbaby"
|
|
],
|
|
"locations": [],
|
|
"dates": [
|
|
"2008"
|
|
],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Derek\"],\n \"organizations\": [\"CDBaby\"],\n \"locations\": [],\n \"dates\": [\"2008\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Derek\"],\n \"organizations\": [\"CDBaby\"],\n \"locations\": [],\n \"dates\": [\"2008\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"Derek\"],\n \"organizations\": [\"CDBaby\"],\n \"dates\": [\"2008\"],\n \"document_type\": \"article\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "a8366d89_185",
|
|
"source": "Hackers and Painters_ Big Ideas from the Computer Age -- Graham, Paul.pdf",
|
|
"content_hash": "40a71745",
|
|
"content_length": 2878,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
13.1,
|
|
3.6,
|
|
4.3
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"harvard",
|
|
"princeton"
|
|
],
|
|
"organizations": [
|
|
"national center for education statistics"
|
|
],
|
|
"locations": [],
|
|
"dates": [
|
|
"1800",
|
|
"1970"
|
|
],
|
|
"document_type": "book chapter"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Princeton\", \"Harvard\"],\n \"organizations\": [\"National Center for Education Statistics\"],\n \"locations\": [],\n \"dates\": [\"1970\", \"1800\"],\n \"document_type\": \"book chapter\"\n}",
|
|
"{\n \"people\": [\"Prince-ton\", \"Harvard\"],\n \"organizations\": [],\n \"locations\": [],\n \"dates\": [\"1970\", \"1800\"],\n \"document_type\": \"book\"\n}",
|
|
"{\n \"people\": [\"Prince-ton\", \"Harvard\"],\n \"organizations\": [\"National Center for Education Statistics\"],\n \"locations\": [],\n \"dates\": [\"1800\", \"1970\"],\n \"document_type\": \"book\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "87abf773_21",
|
|
"source": "GrasshopperPrimer_V3-3_EN.pdf",
|
|
"content_hash": "beae43ed",
|
|
"content_length": 2746,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
12.1,
|
|
3.0,
|
|
2.2
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"grasshopper"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "text"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [\"Grasshopper\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Grasshopper\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"instruction\"\n}",
|
|
"{\n \"locations\": [\"Graph Mapper\", \"Dropdown List mode\"],\n \"document_type\": \"instruction manual\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "05812e17_18",
|
|
"source": "EXPERIENCE MACHINE _ how our minds predict and shape reality -- Andy Clark.pdf",
|
|
"content_hash": "ddabef58",
|
|
"content_length": 2920,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
9.8,
|
|
2.8,
|
|
2.0
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"andy clark"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "article"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"ANDY CLARK\"],\n \"document_type\": \"article\"\n}",
|
|
"{\n \"people\": [\"ANDY CLARK\"],\n \"dates\": [],\n \"organizations\": [],\n \"locations\": [],\n \"document_type\": \"text\"\n}",
|
|
"{\n \"people\": [\"ANDY CLARK\"],\n \"document_type\": \"text\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "f548556b_2",
|
|
"source": "AARON_NELSON-DIGITAL_HAPTIC_2020.pdf",
|
|
"content_hash": "aae21623",
|
|
"content_length": 2076,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
10.7,
|
|
2.9,
|
|
2.8
|
|
],
|
|
"extraction_sample": {
|
|
"people": [],
|
|
"organizations": [
|
|
"grasshopper",
|
|
"history of design"
|
|
],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "course_description"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [],\n \"organizations\": [\"Grasshopper\", \"History of Design\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"course_description\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Grasshopper\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Course Outline\"\n}",
|
|
"{\n \"people\": [],\n \"organizations\": [\"Grasshopper\"],\n \"locations\": [],\n \"dates\": [],\n \"document_type\": \"Course Description\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "211f2199_13",
|
|
"source": "The E-myth revisited _ why most small businesses don't work -- Michael E_ Gerber.pdf",
|
|
"content_hash": "0356a33c",
|
|
"content_length": 2754,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.4,
|
|
1.7,
|
|
1.6
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"the fat guy",
|
|
"you"
|
|
],
|
|
"organizations": [],
|
|
"locations": [],
|
|
"dates": [],
|
|
"document_type": "story"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"You\", \"The Fat Guy\"],\n \"document_type\": \"story\"\n}",
|
|
"{\n \"people\": [\"You\", \"The Fat Guy\"],\n \"document_type\": \"fiction\"\n}",
|
|
"{\n \"people\": [\"You\", \"The Fat Guy\"],\n \"document_type\": \"story\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "cd3d1914_76",
|
|
"source": "The world beyond your head _ on becoming an individual in an -- Crawford, Matthew B.pdf",
|
|
"content_hash": "e9b45cb5",
|
|
"content_length": 2944,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
11.2,
|
|
3.3,
|
|
2.9
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"nicholas schiill"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"las vegas"
|
|
],
|
|
"dates": [],
|
|
"document_type": "book review"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"Nicholas Schiill\"],\n \"organizations\": [],\n \"locations\": [\"Las Vegas\"],\n \"dates\": [],\n \"document_type\": \"book review\"\n}",
|
|
"{\n \"people\": [\"Nick Yablonsky\", \"Schiill\"],\n \"organizations\": [],\n \"locations\": [\"Las Vegas\"],\n \"dates\": [],\n \"document_type\": \"book review\"\n}",
|
|
"{\n \"people\": [\"Schiill\"],\n \"organizations\": [],\n \"locations\": [\"Las Vegas\"],\n \"dates\": [],\n \"document_type\": \"book review\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "fc378df0_366",
|
|
"source": "ulysses.txt",
|
|
"content_hash": "293108da",
|
|
"content_length": 2798,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
15.6,
|
|
4.2,
|
|
4.1
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"bloom",
|
|
"j. j. o'molloy"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"the land of the pharaoh"
|
|
],
|
|
"dates": [],
|
|
"document_type": "dialogue"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"J. J. O'Molloy\", \"Bloom\"],\n \"organizations\": [],\n \"locations\": [\"the land of the Pharaoh\"],\n \"dates\": [],\n \"document_type\": \"dialogue\"\n}",
|
|
"{\n \"people\": [\"J. J. O'Molloy\", \"My client\", \"Bloom\"],\n \"organizations\": [],\n \"locations\": [\"the land of the Pharaoh\"],\n \"dates\": [],\n \"document_type\": \"legal-transcript\"\n}",
|
|
"{\n \"people\": [\"J. J. O'Molloy\", \"Bloom\"],\n \"organizations\": [],\n \"locations\": [\"the land of the Pharaoh\"],\n \"dates\": [],\n \"document_type\": \"legal_transcript\"\n}"
|
|
]
|
|
},
|
|
{
|
|
"id": "a230f2c3_488",
|
|
"source": "Landscape And Memory -- Simon Schama.pdf",
|
|
"content_hash": "4799c645",
|
|
"content_length": 2612,
|
|
"status": "INCONSISTENT",
|
|
"consistent": false,
|
|
"pass_times_seconds": [
|
|
15.1,
|
|
4.8,
|
|
5.2
|
|
],
|
|
"extraction_sample": {
|
|
"people": [
|
|
"john ruskin"
|
|
],
|
|
"organizations": [],
|
|
"locations": [
|
|
"arcadia",
|
|
"euphrates",
|
|
"london",
|
|
"reat mountains"
|
|
],
|
|
"dates": [
|
|
"1894",
|
|
"not specified"
|
|
],
|
|
"document_type": "book"
|
|
},
|
|
"raw_samples": [
|
|
"{\n \"people\": [\"John Ruskin\"],\n \"organizations\": [],\n \"locations\": [\"Reat Mountains\", \"Euphrates\", \"Arcadia\", \"London\"],\n \"dates\": [\"Not specified\", \"1894\"],\n \"document_type\": \"Book\"\n}",
|
|
"{\n \"people\": [\"John Ruskin\", \"Georgies\"],\n \"organizations\": [],\n \"locations\": [\"Reat Mountains\", \"deep Euphrates\", \"Arcaadia\", \"London\"],\n \"dates\": [\"Not specified\", \"1894\"],\n \"document_type\": \"b",
|
|
"{\n \"people\": [\"John Ruskin\", \"\"],\n \"organizations\": [\"Modern Painters\"],\n \"locations\": [\"reat mountains\", \"deep Euphrates\", \"Arcaedia\", \"London\", \"Parliament Hill\"],\n \"dates\": [\"not specified\", \"1"
|
|
]
|
|
}
|
|
],
|
|
"summary": {
|
|
"total": 50,
|
|
"consistent": 9,
|
|
"inconsistent": 41,
|
|
"failed": 0,
|
|
"timeout": 0,
|
|
"consistency_rate": 18.0,
|
|
"cascade_viable": false
|
|
}
|
|
} |