Files
gliner_glirel_tuning/nuextract_results.json
2026-05-04 23:44:11 +02:00

142 lines
14 KiB
JSON

{
"meta": {
"device": "cuda",
"dtype": "torch.bfloat16",
"model": "numind/NuExtract-2.0-2B"
},
"cpu_baseline": {
"T1_flat": {
"elapsed_s": 24.98,
"in_tok": 245,
"out_tok": 79
},
"T2_rich": {
"elapsed_s": 117.51,
"in_tok": 351,
"out_tok": 370
}
},
"T1_corp_short_flat": {
"elapsed_s": 2.88,
"n_input_tokens": 245,
"n_output_tokens": 79,
"raw_text": "{\"people\": [\"Pablo Isla\", \"Jose Maria Alvarez-Pallete\", \"Ignacio Galan\", \"Marina Serrano\", \"Carlos Torres\"], \"organizations\": [\"Telefonica\", \"Inditex\", \"Iberdrola\", \"Endesa\", \"BBVA\"], \"locations\": [\"Artixo, A Coruna\", \"Bilbao\"]}",
"parsed": {
"people": [
"Pablo Isla",
"Jose Maria Alvarez-Pallete",
"Ignacio Galan",
"Marina Serrano",
"Carlos Torres"
],
"organizations": [
"Telefonica",
"Inditex",
"Iberdrola",
"Endesa",
"BBVA"
],
"locations": [
"Artixo, A Coruna",
"Bilbao"
]
},
"input_chars": 658
},
"T2_corp_short_rich": {
"elapsed_s": 9.94,
"n_input_tokens": 351,
"n_output_tokens": 363,
"raw_text": "{\"organizations\": [{\"name\": \"Telefonica\", \"ceo\": \"Jose Maria Alvarez-Pallete\", \"chairman_president\": \"Jose Maria Alvarez-Pallete\", \"headquartered_in\": \"Madrid\", \"subsidiaries\": [], \"parent_company\": null}, {\"name\": \"Iberdrola\", \"ceo\": \"Ignacio Galan\", \"chairman_president\": null, \"headquartered_in\": \"Bilbao\", \"subsidiaries\": [], \"parent_company\": null}, {\"name\": \"Endesa\", \"ceo\": \"Marina Serrano\", \"chairman_president\": null, \"headquartered_in\": \"Bilbao\", \"subsidiaries\": [], \"parent_company\": null}, {\"name\": \"BBVA\", \"ceo\": \"Carlos Torres\", \"chairman_president\": null, \"headquartered_in\": \"Bilbao\", \"subsidiaries\": [], \"parent_company\": null}], \"people\": [{\"name\": \"Pablo Isla\", \"role\": \"Consejero\", \"organization\": \"Inditex\"}, {\"name\": \"Jose Maria Alvarez-Pallete\", \"role\": \"Presidente\", \"organization\": \"Telefonica\"}, {\"name\": \"Ignacio Galan\", \"role\": \"Presidente\", \"organization\": \"Iberdrola\"}, {\"name\": \"Marina Serrano\", \"role\": \"CEO\", \"organization\": \"Endesa\"}], \"agreements\": [{\"between\": [\"Telefonica\", \"Iberdrola\", \"Endesa\"], \"topic\": \"colaboracion en proyectos eolicos en Galicia\", \"amount\": \"2.000 millones de euros en cinco anos\"}]}",
"parsed": {
"between": [
"Telefonica",
"Iberdrola",
"Endesa"
],
"topic": "colaboracion en proyectos eolicos en Galicia",
"amount": "2.000 millones de euros en cinco anos"
},
"input_chars": 658
},
"T3_long_text_rich": {
"elapsed_s": 53.56,
"n_input_tokens": 952,
"n_output_tokens": 2048,
"raw_text": "{\"organizations\": [{\"name\": \"BBVA\", \"ceo\": \"Carlos Torres\", \"chairman_president\": \"Carlos Torres\", \"headquartered_in\": \"Bilbao\", \"subsidiaries\": [\"Banco Sabadell\"], \"parent_company\": \"BBVA\"}, {\"name\": \"Banco Santander\", \"ceo\": \"Ana Botin\", \"chairman_president\": \"Ana Botin\", \"headquartered_in\": \"Valencia\", \"subsidiaries\": [\"CaixaBank\", \"Bankia\"], \"parent_company\": \"Banco Santander\"}, {\"name\": \"CaixaBank\", \"ceo\": \"Hector Grisi\", \"chairman_president\": \"Hector Grisi\", \"headquartered_in\": \"Valencia\", \"subsidiaries\": [\"Bankia\"], \"parent_company\": \"CaixaBank\"}, {\"name\": \"Banco de Espana\", \"ceo\": \"Pablo Hernandez de Cos\", \"chairman_president\": \"Pablo Hernandez de Cos\", \"headquartered_in\": null, \"subsidiaries\": [], \"parent_company\": \"Banco de Espana\"}, {\"name\": \"La Comision Nacional del Mercado de Valores\", \"ceo\": \"Rodrigo Buenaventura\", \"chairman_president\": \"Rodrigo Buenaventura\", \"headquartered_in\": null, \"subsidiaries\": [], \"parent_company\": null}, {\"name\": \"Telefonica\", \"ceo\": \"Jose Maria Alvarez-Pallete\", \"chairman_president\": \"Jose Maria Alvarez-Pallete\", \"headquartered_in\": null, \"subsidiaries\": [], \"parent_company\": \"Telefonica\"}, {\"name\": \"Saudi Telecom Company\", \"ceo\": \"Andy Jassy\", \"chairman_president\": \"Andy Jassy\", \"headquartered_in\": null, \"subsidiaries\": [], \"parent_company\": \"Saudi Telecom Company\"}, {\"name\": \"Recurso Humanos del Grupo Mapfre\", \"ceo\": \"Cristina Aldamiz-Echevarria\", \"chairman_president\": \"Cristina Aldamiz-Echevarria\", \"headquartered_in\": null, \"subsidiaries\": [], \"parent_company\": \"Grupo Mapfre\"}], \"people\": [{\"name\": \"Carlos Torres\", \"role\": \"presidente\", \"organization\": \"BBVA\"}, {\"name\": \"Onur Genc\", \"role\": \"consejero delegado\", \"organization\": \"Banco Sabadell\"}, {\"name\": \"Josep Oliu\", \"role\": \"presidente\", \"organization\": \"Sabadell\"}, {\"name\": \"Josep Oliu\", \"role\": \"presidente\", \"organization\": \"Sabadell\"}, {\"name\": \"Josu Jon Imaz\", \"role\": \"CEO\", \"organization\": \"Repsol\"}, {\"name\": \"Antonio Brufau\", \"role\": \"presidente\", \"organization\": \"Repsol\"}, {\"name\": \"Josu Jon Imaz\", \"role\": \"CEO\", \"organization\": \"Repsol\"}, {\"name\": \"Antonio Brufau\", \"role\": \"presidente\", \"organization\": \"Repsol\"}, {\"name\": \"Josu Jon Imaz\", \"role\": \"CEO\", \"organization\": \"Repsol\"}, {\"name\": \"Ignacio Galan\", \"role\": \"CEO\", \"organization\": \"Iberdrola\"}, {\"name\": \"Andy Jassy\", \"role\": \"CEO\", \"organization\": \"Amazon\"}, {\"name\": \"Marina Serrano\", \"role\": \"CEO\", \"organization\": \"Endesa\"}, {\"name\": \"Florentino Perez\", \"role\": \"presidente\", \"organization\": \"ACS\"}, {\"name\": \"Rafael del Pino\", \"role\": \"presidente\", \"organization\": \"Ferrovial\"}, {\"name\": \"Pablo Isla\", \"role\": \"expresidente de Inditex\", \"organization\": \"Inditex\"}, {\"name\": \"Jose Maria Alvarez-Pallete\", \"role\": \"presidente\", \"organization\": \"Telefonica\"}, {\"name\": \"Cristina Aldamiz-Echevarria\", \"role\": \"directora de Recursos Humanos\", \"organization\": \"Grupo Mapfre\"}, {\"name\": \"Francisco Reynes\", \"role\": \"presidente\", \"organization\": \"Naturgy\"}, {\"name\": \"Marc Murtra\", \"role\": \"presidente\", \"organization\": \"Indra\"}, {\"name\": \"Margarita Robles\", \"role\": \"presidente\", \"organization\": \"Indra\"}, {\"name\": \"Antonio Huertas\", \"role\": \"directora de Recursos Humanos\", \"organization\": \"Grupo Mapfre\"}], \"agreements\": [{\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"integracion operativa\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA hostil\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"independencia del banco\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"contrato a Iberdrola\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"entrada del estado en su capital\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"topic\": \"OPA parcial\", \"amount\": null}, {\"between\": [\"BBVA\", \"Sabadell\"], \"",
"parsed": null,
"input_chars": 2722
},
"pdf_meta": {
"n_chunks": 97,
"clean_chars": 88714
},
"T4_pdf_chunks": [
{
"chunk_idx": 0,
"elapsed_s": 2.84,
"n_input_tokens": 581,
"n_output_tokens": 115,
"raw_text": "{\"data_controller\": {\"name\": \"Banco Bilbao Vizcaya Argentaria, S.A.\", \"address\": \"Plaza de San Nicolás 4, 48005 Bilbao, España\", \"registration\": \"C.I.F. A-48265169\"}, \"dpo_contact\": {\"email\": \"consultasgenerales@bbva.com\", \"address\": null}, \"data_categories\": [], \"rights_listed\": [], \"authorities_mentioned\": [], \"laws_mentioned\": []}",
"parsed": {
"email": "consultasgenerales@bbva.com",
"address": null
},
"input_chars": 1448
},
{
"chunk_idx": 5,
"elapsed_s": 4.03,
"n_input_tokens": 559,
"n_output_tokens": 160,
"raw_text": "{\"data_controller\": {\"name\": \"Banco Bilbao Vizcaya Argentaria, S.A.\", \"address\": \"Plaza San Nicolás, 4, 48005 Bilbao, España\", \"registration\": \"C.I.F. A-48265169\"}, \"dpo_contact\": {\"email\": \"consultasgenerales@bbva.com\", \"address\": \"Plaza de San Nicolás 4, 48005, Bilbao, España\"}, \"data_categories\": [\"Datos identificativos y de contacto\", \"Información sobre productos y servicios\", \"Información sobre servicios de comercio\"], \"rights_listed\": [], \"authorities_mentioned\": [], \"laws_mentioned\": []}",
"parsed": {
"email": "consultasgenerales@bbva.com",
"address": "Plaza de San Nicolás 4, 48005, Bilbao, España"
},
"input_chars": 1483
},
{
"chunk_idx": 15,
"elapsed_s": 4.69,
"n_input_tokens": 530,
"n_output_tokens": 184,
"raw_text": "{\"data_controller\": {\"name\": null, \"address\": null, \"registration\": null}, \"dpo_contact\": {\"email\": null, \"address\": null}, \"data_categories\": [\"Datos de firma (incluida la firma digitalizada y electrónica)\", \"Datos económicos y de solvencia patrimonial\", \"Datos sociodemográficos\", \"Datos obtenidos de otras fuentes\", \"Información de solvencia de la Central de Información de Riesgos del Banco de España (CIRBE)\", \"Información obtenida de los sistemas de información crediticia\", \"Datos de otros productos en los que participes como garante\", \"Datos de firma (incluida la firma digitalizada y electrónica)\", \"Datos de productos y servicios en los que intervengas\"], \"rights_listed\": [], \"authorities_mentioned\": [], \"laws_mentioned\": []}",
"parsed": {
"email": null,
"address": null
},
"input_chars": 1487
},
{
"chunk_idx": 30,
"elapsed_s": 2.67,
"n_input_tokens": 528,
"n_output_tokens": 106,
"raw_text": "{\"data_controller\": {\"name\": \"Confirma Sistemas de Información, S.L.\", \"address\": \"Avda. de la Industria, 18, TRES CANTOS (28760) MADRID\", \"registration\": null}, \"dpo_contact\": {\"email\": \"dpogrupobbva@bbva.com\", \"address\": null}, \"data_categories\": [], \"rights_listed\": [], \"authorities_mentioned\": [], \"laws_mentioned\": []}",
"parsed": {
"email": "dpogrupobbva@bbva.com",
"address": null
},
"input_chars": 1491
},
{
"chunk_idx": 60,
"elapsed_s": 1.77,
"n_input_tokens": 500,
"n_output_tokens": 71,
"raw_text": "{\"data_controller\": {\"name\": null, \"address\": null, \"registration\": null}, \"dpo_contact\": {\"email\": null, \"address\": null}, \"data_categories\": [], \"rights_listed\": [\"derecho fundamental a la protección de datos personales\"], \"authorities_mentioned\": [], \"laws_mentioned\": []}",
"parsed": {
"email": null,
"address": null
},
"input_chars": 1409
}
],
"full_pdf_extrapolation": {
"avg_per_chunk_s": 3.2,
"n_chunks": 97,
"estimated_total_s": 310.4,
"estimated_total_min": 5.2
}
}