feat: stage2/3 pipeline, taxonomy-free cascade, E1.8/E4 experiments, corpus migration state

This commit is contained in:
2026-04-30 04:04:31 +00:00
parent 62b5b5453a
commit 2b9a1782c1
14 changed files with 6145 additions and 5 deletions
+909
View File
@@ -0,0 +1,909 @@
{
"subsample_a": [
{
"name": "Claude: Lubbock on everything album lyrics",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Songwriting",
"Storytelling",
"Literary Analysis"
],
"frame_relationships": "The Songwriting frame is the primary focus of this content, with the Storytelling and Literary Analysis frames providing context and analysis for understanding Terry Allen's writing style.",
"extraction_orientation": "Look for specific elements of Allen's writing style as outlined by Claude, including conversational deadpan, specificity as worldbuilding, humor next to heartbreak, the 'report from the inside' voice, short, punchy, declarative sentences, and characters as shorthand for the place.",
"one_sentence_summary": "A discussion about Terry Allen's album Lubbock (on Everything) and its writing style, with guidance on how to emulate it for a creative project"
},
"taxfree_orientation": "Active frames: Songwriting, Storytelling, Literary Analysis. Frame relationships: The Songwriting frame is the primary focus of this content, with the Storytelling and Literary Analysis frames providing context and analysis for understanding Terry Allen's writing style. Extraction focus: Look for specific elements of Allen's writing style as outlined by Claude, including conversational deadpan, specificity as worldbuilding, humor next to heartbreak, the 'report from the inside' voice, short, punchy, declarative sentences, and characters as shorthand for the place. Summary: A discussion about Terry Allen's album Lubbock (on Everything) and its writing style, with guidance on how to emulate it for a creative project",
"e14_prod_preds": 11,
"e14_cascade_preds": 4,
"e14_delta_preds": -7,
"e14_prod_edges": 17,
"e14_cascade_edges": 5,
"e14_delta_edges": -12
},
{
"name": "ChatGPT: Tulsa Concept Album Guide",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Personal_Narrative",
"Place_Exploration",
"Autobiography"
],
"frame_relationships": "The Personal_Narrative and Place_Exploration frames are intertwined, with the album being a personal account of the writer's experiences in Tulsa. The Autobiography frame is used to disguise the concept album as a traditional autobiography.",
"extraction_orientation": "The most relationship-rich content can be found in the vignettes and track descriptions, as they provide insights into the writer's personal experiences, emotions, and perceptions of Tulsa.",
"one_sentence_summary": "The document describes a planned concept album about the writer's personal experiences growing up in Tulsa, Oklahoma, inspired by Terry Allen's *Lubbock (on Everything)*, with a focus on exploring themes related to race, religion, nostalgia, and departure."
},
"taxfree_orientation": "Active frames: Personal_Narrative, Place_Exploration, Autobiography. Frame relationships: The Personal_Narrative and Place_Exploration frames are intertwined, with the album being a personal account of the writer's experiences in Tulsa. The Autobiography frame is used to disguise the concept album as a traditional autobiography. Extraction focus: The most relationship-rich content can be found in the vignettes and track descriptions, as they provide insights into the writer's personal experiences, emotions, and perceptions of Tulsa. Summary: The document describes a planned concept album about the writer's personal experiences growing up in Tulsa, Oklahoma, inspired by Terry Allen's *Lubbock (on Everything)*, with a focus on exploring themes related to race, religion, nostalgia, and departure.",
"e14_prod_preds": 10,
"e14_cascade_preds": 4,
"e14_delta_preds": -6,
"e14_prod_edges": 19,
"e14_cascade_edges": 16,
"e14_delta_edges": -3
},
{
"name": "ChatGPT: Rhino 3D object flow",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Digital Fabrication",
"Philosophical Concepts",
"Design Process"
],
"frame_relationships": "The philosophical concepts provide a framework for understanding and describing digital fabrication processes.",
"extraction_orientation": "Focus on the mapping between the philosophical concepts and the digital fabrication processes",
"one_sentence_summary": "Discussion about how Deleuze's ideas map onto digital fabrication processes in architecture, design, and fabrication labs"
},
"taxfree_orientation": "Active frames: Digital Fabrication, Philosophical Concepts, Design Process. Frame relationships: The philosophical concepts provide a framework for understanding and describing digital fabrication processes. Extraction focus: Focus on the mapping between the philosophical concepts and the digital fabrication processes Summary: Discussion about how Deleuze's ideas map onto digital fabrication processes in architecture, design, and fabrication labs",
"e14_prod_preds": 16,
"e14_cascade_preds": 11,
"e14_delta_preds": -5,
"e14_prod_edges": 31,
"e14_cascade_edges": 28,
"e14_delta_edges": -3
},
{
"name": "Claude: SUNY faculty conflict of interest policies",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"Educational Policy",
"Workplace Ethics",
"Conflict of Interest",
"Academia-Industry Collaboration"
],
"frame_relationships": "The document primarily discusses the SUNY conflict of interest policy for faculty members, focusing on outside work and consulting. The system-level policy and specific campus handbooks are provided as resources.",
"extraction_orientation": "Look for details about the nature of the consulting firm, its relationship with the academic work, and compliance with state ethics laws and SUNY policies.",
"one_sentence_summary": "This document outlines SUNY conflict of interest policies for faculty members engaging in outside work or consulting."
},
"taxfree_orientation": "Active frames: Educational Policy, Workplace Ethics, Conflict of Interest, Academia-Industry Collaboration. Frame relationships: The document primarily discusses the SUNY conflict of interest policy for faculty members, focusing on outside work and consulting. The system-level policy and specific campus handbooks are provided as resources. Extraction focus: Look for details about the nature of the consulting firm, its relationship with the academic work, and compliance with state ethics laws and SUNY policies. Summary: This document outlines SUNY conflict of interest policies for faculty members engaging in outside work or consulting.",
"e14_prod_preds": 7,
"e14_cascade_preds": 3,
"e14_delta_preds": -4,
"e14_prod_edges": 10,
"e14_cascade_edges": 3,
"e14_delta_edges": -7
},
{
"name": "Claude: Interview presentation research and preparation",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"Digital-Physical Interface",
"Emerging Technologies"
],
"frame_relationships": "The Digital-Physical Interface frame centers the workflow between digital models and physical objects, while Emerging Technologies highlights the specific tools (AI, XR) used in this workflow.",
"extraction_orientation": "Look for instances where the workflow between digital models and physical objects is described, as well as mentions of AI or XR technologies being used in this context.",
"one_sentence_summary": "A discussion on the intersection of AI and XR in a design project, focusing on the digital-physical workflow and its implications for teaching."
},
"taxfree_orientation": "Active frames: Digital-Physical Interface, Emerging Technologies. Frame relationships: The Digital-Physical Interface frame centers the workflow between digital models and physical objects, while Emerging Technologies highlights the specific tools (AI, XR) used in this workflow. Extraction focus: Look for instances where the workflow between digital models and physical objects is described, as well as mentions of AI or XR technologies being used in this context. Summary: A discussion on the intersection of AI and XR in a design project, focusing on the digital-physical workflow and its implications for teaching.",
"e14_prod_preds": 9,
"e14_cascade_preds": 5,
"e14_delta_preds": -4,
"e14_prod_edges": 10,
"e14_cascade_edges": 10,
"e14_delta_edges": 0
},
{
"name": "ChatGPT: Respect Individual Interests for Christmas",
"bucket": "low",
"taxfree_metadata": {
"active_frames": [
"Gift Giving",
"Interests and Preferences",
"Holiday Season"
],
"frame_relationships": "The frames of gift giving and interests/preferences are intertwined as the document discusses choosing gifts based on a recipient's unique hobbies and preferences during the holiday season.",
"extraction_orientation": "Focus on relational content that describes how specific gifts align with an individual's interests or preferences, and consider the context of the holiday season.",
"one_sentence_summary": "The document provides advice on choosing Christmas gifts based on an individual's unique interests and preferences."
},
"taxfree_orientation": "Active frames: Gift Giving, Interests and Preferences, Holiday Season. Frame relationships: The frames of gift giving and interests/preferences are intertwined as the document discusses choosing gifts based on a recipient's unique hobbies and preferences during the holiday season. Extraction focus: Focus on relational content that describes how specific gifts align with an individual's interests or preferences, and consider the context of the holiday season. Summary: The document provides advice on choosing Christmas gifts based on an individual's unique interests and preferences.",
"e14_prod_preds": 3,
"e14_cascade_preds": 1,
"e14_delta_preds": -2,
"e14_prod_edges": 3,
"e14_cascade_edges": 1,
"e14_delta_edges": -2
},
{
"name": "University of North Texas Cover letter.pdf",
"bucket": "document",
"taxfree_metadata": {
"active_frames": [
"Education",
"Job Application",
"Artwork Creation",
"Academia"
],
"frame_relationships": "The 'Education' and 'Job Application' frames are the primary drivers of the document, with 'Artwork Creation' providing contextual details. The 'Academia' frame serves as a broader context for all other frames.",
"extraction_orientation": "Focus on relations between the applicant's educational background, job application, and artworks to understand their qualifications and fit for the position.",
"one_sentence_summary": "This document details an artist's application for a Senior Lecturer position in Computing in the Visual Arts at University of North Texas, highlighting their educational background, teaching experience, and artistic practice."
},
"taxfree_orientation": "Active frames: Education, Job Application, Artwork Creation, Academia. Frame relationships: The 'Education' and 'Job Application' frames are the primary drivers of the document, with 'Artwork Creation' providing contextual details. The 'Academia' frame serves as a broader context for all other frames. Extraction focus: Focus on relations between the applicant's educational background, job application, and artworks to understand their qualifications and fit for the position. Summary: This document details an artist's application for a Senior Lecturer position in Computing in the Visual Arts at University of North Texas, highlighting their educational background, teaching experience, and artistic practice.",
"e14_prod_preds": 10,
"e14_cascade_preds": 8,
"e14_delta_preds": -2,
"e14_prod_edges": 13,
"e14_cascade_edges": 12,
"e14_delta_edges": -1
},
{
"name": "Claude: Finding ideal rural housing near University of Utah",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Geography",
"Community",
"Housing",
"Transportation"
],
"frame_relationships": "The geographical location and community characteristics inform the housing and transportation options in each area.",
"extraction_orientation": "Focus on the specific details about Morgan, Kamas Valley, and Heber City/Midway regarding their character, housing, commute specifics to U of U, demographics, and vegetation.",
"one_sentence_summary": "Document discusses potential rural living situations near University of Utah, comparing Morgan, Kamas Valley (Oakley, Kamas, Francis), and Heber City/Midway in terms of geography, community, housing, transportation, and demographics."
},
"taxfree_orientation": "Active frames: Geography, Community, Housing, Transportation. Frame relationships: The geographical location and community characteristics inform the housing and transportation options in each area. Extraction focus: Focus on the specific details about Morgan, Kamas Valley, and Heber City/Midway regarding their character, housing, commute specifics to U of U, demographics, and vegetation. Summary: Document discusses potential rural living situations near University of Utah, comparing Morgan, Kamas Valley (Oakley, Kamas, Francis), and Heber City/Midway in terms of geography, community, housing, transportation, and demographics.",
"e14_prod_preds": 14,
"e14_cascade_preds": 13,
"e14_delta_preds": -1,
"e14_prod_edges": 28,
"e14_cascade_edges": 30,
"e14_delta_edges": 2
},
{
"name": "ChatGPT: SEC coaches with OSU ties",
"bucket": "high",
"taxfree_metadata": {
"error": {
"message": "An error occurred",
"details": [
{
"title": "OEmbed request error",
"url": "https://api.twitter.com/1.1/oembed?url=https%3A%2F%2Fmobile.twitter.com%2Fstatus%2F1657087050422960128",
"message": "Failed to load external media.\nThis is likely not a stable URL for an oEmbed."
}
]
}
},
"taxfree_orientation": "Active frames: . Frame relationships: Extraction focus: Summary: ",
"e14_prod_preds": 5,
"e14_cascade_preds": 4,
"e14_delta_preds": -1,
"e14_prod_edges": 25,
"e14_cascade_edges": 24,
"e14_delta_edges": -1
},
{
"name": "Claude: Bonding ASA 3D printed parts",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"Bonding",
"Material_Selection",
"3D_Printed_Parts",
"Adhesives"
],
"frame_relationships": "The frames 'Bonding' and 'Material_Selection' are active, with the latter providing context for the former by discussing suitable adhesives for bonding 3D printed parts.",
"extraction_orientation": "Focus on the properties, application areas, and relative strength of the discussed adhesives in relation to ASA 3D printed parts.",
"one_sentence_summary": "This document provides recommendations on various adhesives for bonding ASA 3D printed parts."
},
"taxfree_orientation": "Active frames: Bonding, Material_Selection, 3D_Printed_Parts, Adhesives. Frame relationships: The frames 'Bonding' and 'Material_Selection' are active, with the latter providing context for the former by discussing suitable adhesives for bonding 3D printed parts. Extraction focus: Focus on the properties, application areas, and relative strength of the discussed adhesives in relation to ASA 3D printed parts. Summary: This document provides recommendations on various adhesives for bonding ASA 3D printed parts.",
"e14_prod_preds": 5,
"e14_cascade_preds": 4,
"e14_delta_preds": -1,
"e14_prod_edges": 10,
"e14_cascade_edges": 11,
"e14_delta_edges": 1
},
{
"name": "ChatGPT: Title: User request summary.",
"bucket": "low",
"taxfree_metadata": {
"active_frames": [
"Event",
"Speech",
"Hosting",
"Communication"
],
"frame_relationships": "The 'Event' frame is the main context, within which the 'Speech', 'Hosting', and 'Communication' frames are active.",
"extraction_orientation": "Look for the relationships between the host, the event, and the speech content in the introductory text of the document.",
"one_sentence_summary": "The document revolves around a conversation about creating an introductory speech for a design week event."
},
"taxfree_orientation": "Active frames: Event, Speech, Hosting, Communication. Frame relationships: The 'Event' frame is the main context, within which the 'Speech', 'Hosting', and 'Communication' frames are active. Extraction focus: Look for the relationships between the host, the event, and the speech content in the introductory text of the document. Summary: The document revolves around a conversation about creating an introductory speech for a design week event.",
"e14_prod_preds": 3,
"e14_cascade_preds": 2,
"e14_delta_preds": -1,
"e14_prod_edges": 3,
"e14_cascade_edges": 2,
"e14_delta_edges": -1
},
{
"name": "ChatGPT: Scholarship Recommendation Letter Tips",
"bucket": "low",
"taxfree_metadata": {
"active_frames": [
"Recommendation",
"Education",
"Professional Skills",
"Personal Characteristics",
"Achievements",
"Future Potential"
],
"frame_relationships": "The frames interact to provide a comprehensive assessment of the candidate's qualifications for a scholarship, focusing on both their academic and personal qualities.",
"extraction_orientation": "Relational content to focus on includes relationships between the recommender and applicant, the applicant's achievements, contributions, and potential, as well as examples supporting the description of personal traits.",
"one_sentence_summary": "This document outlines guidelines for writing a scholarship recommendation letter, covering key areas such as introduction, purpose, academic and professional qualities, personal characteristics, achievements, future potential, conclusion, and letter formatting."
},
"taxfree_orientation": "Active frames: Recommendation, Education, Professional Skills, Personal Characteristics, Achievements, Future Potential. Frame relationships: The frames interact to provide a comprehensive assessment of the candidate's qualifications for a scholarship, focusing on both their academic and personal qualities. Extraction focus: Relational content to focus on includes relationships between the recommender and applicant, the applicant's achievements, contributions, and potential, as well as examples supporting the description of personal traits. Summary: This document outlines guidelines for writing a scholarship recommendation letter, covering key areas such as introduction, purpose, academic and professional qualities, personal characteristics, achievements, future potential, conclusion, and letter formatting.",
"e14_prod_preds": 2,
"e14_cascade_preds": 1,
"e14_delta_preds": -1,
"e14_prod_edges": 2,
"e14_cascade_edges": 1,
"e14_delta_edges": -1
}
],
"subsample_b": [
{
"name": "ChatGPT: Job application comparison",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Job Application",
"Education & Qualifications Comparison",
"School Leadership Profile",
"Arts Education & Facilities Management"
],
"frame_relationships": "The frames interact by comparing the applicant's qualifications to the job requirements, peer deans' profiles, and the mission of the School of the Arts at Western.",
"extraction_orientation": "Relational content a knowledge graph extractor should look for includes comparisons between the applicant's profile and job requirements, peer dean profiles, and the School of the Arts at Western's mission.",
"one_sentence_summary": "This document discusses a job application for a Dean position in the new School of the Arts at Western, comparing the applicant's qualifications to job requirements and peer deans' profiles while emphasizing their fit with the School's mission."
},
"standard_metadata": {
"language": "en",
"char_length": 1569,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": true,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": true
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": true,
"has_technical_terminology": true,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "Discussion about a job application for the dean position at Western's School of the Arts, comparing it to other similar schools and analyzing the applicant's qualifications."
}
},
{
"name": "ChatGPT: External review for tenure",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Tenure Review",
"Academic Evaluation",
"Peer Review"
],
"frame_relationships": "The Tenure Review frame is the central and overarching context in which the other frames (Academic Evaluation, Peer Review) are activated.",
"extraction_orientation": "Focus on the specific criteria, standards, and expectations related to tenure review, as well as the evaluation process itself.",
"one_sentence_summary": "This document provides guidelines for an external evaluator in a tenure review process, detailing what materials to expect, how to structure the evaluation letter, and what aspects to consider in assessing research/creative activity, teaching, service, and overall recommendation."
},
"standard_metadata": {
"language": "en",
"char_length": 1963,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": true
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": true,
"has_technical_terminology": true,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "This document provides guidelines for an external reviewer to evaluate a faculty member's record for tenure."
}
},
{
"name": "Claude: University of Utah interview teaching example",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"Education",
"Teaching",
"Computational Design",
"Programming for Arts",
"3D Printing"
],
"frame_relationships": "The document discusses a university course, its curriculum, and related projects; these topics are interconnected as they all revolve around the teaching of computational design in a university setting.",
"extraction_orientation": "Look for relationships between the course content, its objectives, and practical applications, including programming languages used, projects undertaken, and equipment utilized.",
"one_sentence_summary": "The document describes a university course offering on computational design for arts, covering topics such as programming in Processing/Java, 3D printing, advanced slicer techniques, Stratasys equipment usage, and certification options."
},
"standard_metadata": {
"language": "en",
"char_length": 1624,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": false,
"has_technical_terminology": true,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "Discussion about a course teaching computational techniques for 3D design at the University of Utah"
}
},
{
"name": "ChatGPT: Starting Dropship Gun Business",
"bucket": "high",
"taxfree_metadata": {
"active_frames": [
"GunBusinessSetup",
"FFLCompliance",
"DistributorRelationshipBuilding",
"Ecommerce"
],
"frame_relationships": "The 'GunBusinessSetup' frame involves navigating multiple layers of compliance (FFL, zoning, and state/local laws) while building relationships with distributors and setting up an e-commerce platform.",
"extraction_orientation": "Focus on the detailed workflows for obtaining FFL, setting up compliant e-commerce store, finding a distributor, and establishing B2B credit relationship with them.",
"one_sentence_summary": "A guide detailing how to start a dropship gun business in the US, including the legal requirements, necessary setup steps, and tips for building relationships with distributors."
},
"standard_metadata": {
"language": "en",
"char_length": 2764,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": true,
"has_technical_terminology": true,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "This document provides a detailed guide on how to set up a dropship gun business in the U.S., covering licensing, setting up compliant premises, understanding regulations, dealing with payments and e-commerce platforms, and building relationships with distributors."
}
},
{
"name": "ChatGPT: Analyze business plan",
"bucket": "high",
"taxfree_metadata": {},
"standard_metadata": {
"assistant_name": "aaron",
"role": "assistant",
"version": "7.1.0-alpha",
"name": "Business Plan Analysis - Employees and Contractors Only",
"messages": [
{
"role": "system",
"content": "Here's an analysis of the business plan focusing only on the employees and contractors expenses, comparing them to the provided OpEx bands."
},
{
"role": "assistant",
"content": "First, let me load the data from the excel file and format the columns.\n\nimport pandas as pd\nimport numpy as np\nimport matplotlib.pyplot as plt\nfrom caas_jupyter_tools import display_dataframe_to_user\npath = '/mnt/data/EAS Staffing.xlsx'\ndf = pd.read_excel(path, header=9)\ndf = df.dropna(axis=1, how='all')\ndf.columns = [str(c).strip().lower().replace('\n',' ').replace(' ', '_') for c in df.columns]\n"
},
{
"role": "assistant",
"content": "Next, let's identify the month columns and fill any missing values with 0.\n\nmonth_cols = [c for c in df.columns if c.startswith('m') and c[1:].lstrip('-').isdigit()]\nmonth_cols = [c for c in month_cols if int(c[1:]) >= 0]\nmonth_cols = sorted(month_cols, key=lambda c: int(c[1:]))\nfor c in month_cols:\ndf[c] = pd.to_numeric(df[c], errors='coerce').fillna(0)"
},
{
"role": "assistant",
"content": "Now, let's filter the data to only include employees and contractors (exclude subtotals/notes).\n\nmask_emp_con = df['type'].astype(str).str.lower().str.contains('employee|contract', na=False)\nempcon = df.loc[mask_emp_con].copy()"
},
{
"role": "assistant",
"content": "Next, let's compute the total staffing costs for each month.\n\ntotals = pd.DataFrame({ 'MonthIndex': [int(c[1:]) for c in month_cols], 'Staffing_Total': [empcon[c].sum() for c in month_cols] })\n"
},
{
"role": "assistant",
"content": "Now, let's define the years 1 and 2 masks based on the total index.\ny1 = totals['MonthIndex'] <= 11\ny2 = (totals['MonthIndex'] >= 12) & (totals['MonthIndex'] <= 23)"
},
{
"role": "assistant",
"content": "Finally, let's compare the total staffing costs to the provided OpEx bands for years 1 and 2.\n\nYear 1 (M1 - M11): Staffing_Total: $"
},
{
"role": "assistant",
"content": "\tSum(totals.loc[y1, 'Staffing_Total']): ${:,.0f}\n\nYear 2 (M12 - M24): Staffing_Total: $"
},
{
"role": "assistant",
"content": "\tSum(totals.loc[y2, 'Staffing_Total']): ${:,.0f}"
}
]
}
},
{
"name": "ChatGPT: Outdoor Layering Explained",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"Clothing Layering",
"Outdoor Clothing",
"Sweat Management",
"Insulation",
"Protection",
"Weather"
],
"frame_relationships": "The frames interact by defining layers in an outdoor clothing system for managing sweat, insulation, and protection from weather conditions.",
"extraction_orientation": "Focus on the relationships between layers and how they are mixed-and-matched depending on temperature, wind, precipitation, and activity level.",
"one_sentence_summary": "The document describes a 3-layer outdoor clothing system for managing sweat, insulation, and protection from wind, rain, and snow during various activities."
},
"standard_metadata": {
"language": "en",
"char_length": 3761,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": false,
"has_technical_terminology": true,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "The document explains the concept of layering outdoor clothing for different activities and weather conditions, including base layer, mid-layer, and outer layer, as well as hand and leg layers."
}
},
{
"name": "ChatGPT: Limits in Calculus.",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"Mathematics",
"Calculus",
"Functions",
"Limits"
],
"frame_relationships": "The 'Mathematics' and 'Calculus' frames are active. The 'Functions', 'Limits', and 'Calculus' frames are interconnected, as the document discusses the concept of limits in relation to functions within calculus.",
"extraction_orientation": "Look for relational content between functions, their inputs, and the behavior of those functions as they approach certain values (limits).",
"one_sentence_summary": "The document explains the concept of limits in calculus and provides real-world examples to illustrate its use."
},
"standard_metadata": {
"language": "en",
"char_length": 1269,
"primary_format": "prose",
"structural_signals": {
"has_headings": false,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": true
},
"content_signals": {
"has_named_people": false,
"has_institutional_language": false,
"has_technical_terminology": true,
"has_first_person": false,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "Discussion on the concept of limits in calculus and their real-world applications"
}
},
{
"name": "ChatGPT: Academic Program Director Role",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"academic_program",
"administration",
"faculty_management",
"student_engagement",
"curriculum_development"
],
"frame_relationships": "The 'academic program' frame underpins the entire document, with 'administration', 'faculty management', and 'student engagement' frames supporting it. The 'curriculum development' frame is a core function that intersects all other frames.",
"extraction_orientation": "Look for relationships between roles (e.g., program director to faculty, students, administration), responsibilities within each role, and interactions between these responsibilities",
"one_sentence_summary": "This document outlines the key duties of an academic program director in Design and Digital Fabrication programs, focusing on managing faculty, engaging with industry partners, developing curriculum, assessing student outcomes, and fostering student success."
},
"standard_metadata": {
"language": "en",
"char_length": 4507,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": true,
"has_technical_terminology": true,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "Document describes the role and responsibilities of an Academic Program Director for Design and Digital Fabrication programs"
}
},
{
"name": "ChatGPT: Lonely Island Poop Skit",
"bucket": "mid",
"taxfree_metadata": {
"active_frames": [
"Music",
"Humor"
],
"frame_relationships": "The Music frame is used to deliver comedic content within the Humor frame.",
"extraction_orientation": "Look for lyrics or song details that provide a deeper understanding of the comedic narrative.",
"one_sentence_summary": "The document discusses a Lonely Island track, 'Perfect Saturday', which is a comedic musical number about a poop-related incident during a sexual encounter."
},
"standard_metadata": {
"language": "en",
"char_length": 1069,
"primary_format": "mixed",
"structural_signals": {
"has_headings": false,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": true
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": false,
"has_technical_terminology": false,
"has_first_person": false,
"has_quotations": false
},
"domain_class": "conversational",
"one_sentence_summary": "A conversation about finding a specific skit from Lonely Island's albums 'Turtleneck & Chain', 'The Wack Album', or 'Incredibad'"
}
},
{
"name": "ChatGPT: Parse Tidal playlist",
"bucket": "mid",
"taxfree_metadata": {
"active_speaker": "Assistant",
"finetuned_response": {
"source_language": "en",
"target_language": "en",
"dialog_id": 412769058,
"generated_utts": [
{
"role": "Assistant",
"text": "The follow-up playlist for your 80s night has been carefully curated with 25 more danceable tracks that maintain the same vibe as your original list. Here it is:\n\n## \ud83e\udea9 25 More Danceable '80s Tracks (Alt-Club Vibe, Fits Your Original Playlist)\n### \ud83d\udd25 Synthpop / New Wave / Dance-Rock:\n1. **Alphaville \u2013 Forever Young**\n2. **Depeche Mode \u2013 Enjoy the Silence**\n3. **Tears for Fears \u2013 Shout** *(club remix)*\n4. **OMD \u2013 If You Leave**\n5. **The Human League \u2013 Love Action (I Believe in Love)**\n6. **Men Without Hats \u2013 Safety Dance**\n7. **Culture Club \u2013 Time (Clock of the Heart)**\n8. **A Flock of Seagulls \u2013 I Ran (So Far Away)** *(extended 12\u201d version)*\n9. **The Police \u2013 Don't Stand So Close to Me**\n10. **Pet Shop Boys \u2013 It's a Sin**"
},
{
"role": "Assistant",
"text": "### \ud83d\udc83 Funky Post-Punk / Art-Disco Bangers:\n11. **The Stranglers \u2013 Golden Brown**\n12. **Salt-N-Pepa \u2013 Push It** *(early hip hop infused with disco)*\n13. **Chic \u2013 Le Freak**\n14. **Rick James \u2013 Super Freak**\n15. **The Buggles \u2013 Video Killed the Radio Star** *(early MTV staple)*"
},
{
"role": "Assistant",
"text": "### \ud83e\uddca Sleek & Cool Euro-Dance / Underground Synth:\n16. **Kraftwerk \u2013 The Model**\n17. **Japan \u2013 Ghosts** *(haunting, synthpop ballad)*\n18. **New Order \u2013 Blue Monday (Extended 12\u201d Version)** *(one of the longest running UK singles)*\n19. **Soft Cell \u2013 Tainted Love** *(classic remake)*\n20. **Yazoo \u2013 Only You**"
},
{
"role": "Assistant",
"text": "### \ud83c\udf00 Optional Bonus Vibes (For future expansion)\n- **Thompson Twins \u2013 Hold Me Now** *(power ballad)*\n- **ABC \u2013 The Look of Love** *(disco-infused synthpop)*\n- **Simple Minds \u2013 Alive and Kicking** *(anthemic, uplifting)*"
}
]
}
},
"standard_metadata": {
"error": "parse_failed",
"raw": "{\n\"query_id\": \"4b6a7e10-c39d-481f-ae4a-79e3ba6c4cdd\",\n\"results\": [\n {\n \"answer\": \"Sure, I can provide another 25 songs in the same flavor that leans more towards a darker, sexier after-midni"
}
},
{
"name": "NO thesis proposal.pdf",
"bucket": "document",
"taxfree_metadata": {
"active_frames": [
"Artist",
"Career Progression",
"Identity",
"Personal Interests",
"Product Design"
],
"frame_relationships": "The artist's career progression is intertwined with their identity and personal interests, shaping the subject matter and style of their product designs.",
"extraction_orientation": "Focus on relationships between the artist's professional evolution, personal identity, and the creation process of their product designs.",
"one_sentence_summary": "The document discusses a graduate thesis proposal for a 3D modeler, focusing on creating whimsical products with specific subject matters: critters, fish, and poodles."
},
"standard_metadata": {
"language": "en",
"char_length": 602,
"primary_format": "prose",
"structural_signals": {
"has_headings": false,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": false,
"has_technical_terminology": false,
"has_first_person": true,
"has_quotations": false
},
"domain_class": "personal",
"one_sentence_summary": "The document discusses an artist's graduate thesis proposal for a project centered around creating whimsical product designs featuring critters, fish, and poodles."
}
},
{
"name": "PWM.pdf",
"bucket": "document",
"taxfree_metadata": {
"active_frames": [
"Pulse Width Modulation (PWM)",
"Analog to Digital Conversion",
"Arduino ADC"
],
"frame_relationships": "The PWM and Analog to Digital Conversion frames are directly related as they both discuss the principles and applications of PWM in relation to analog-to-digital conversion, while the Arduino ADC frame provides specific context regarding the use of these concepts with an Arduino microcontroller.",
"extraction_orientation": "Look for relationships between PWM and its parameters (time, voltage levels) and their impact on Analog to Digital Conversion resolution and Arduino ADC functions",
"one_sentence_summary": "This document discusses the principles of Pulse Width Modulation, its implementation in Arduino ADC, and the relationship between PWM and analog-to-digital conversion."
},
"standard_metadata": {
"language": "en",
"char_length": 427,
"primary_format": "prose",
"structural_signals": {
"has_headings": false,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": false,
"has_institutional_language": true,
"has_technical_terminology": true,
"has_first_person": false,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "The document discusses Pulse Width Modulation (PWM) and Analog to Digital Conversion in the context of Arduino."
}
},
{
"name": "Will_It_Print.pdf",
"bucket": "document",
"taxfree_metadata": {
"active_frames": [
"Part Design",
"Manufacturing Process",
"Material Removal",
"Surface Finish",
"Support Structures",
"Overhang Features",
"Internal Cavities",
"Tolerances",
"Stress Concentration"
],
"frame_relationships": "The document discusses the design and manufacturing of a part, focusing on its features, material removal, surface finish, support structures, overhangs, internal cavities, tolerances, and stress concentration.",
"extraction_orientation": "Focus on the relationships between the part's design, manufacturing process, and associated features such as overhangs, internal cavities, tolerances, and stress concentration.",
"one_sentence_summary": "This document provides instructions for reducing the number of printing and prototyping failures by Joran Booth, focusing on various aspects of part design and manufacturing."
},
"standard_metadata": {
"language": "en",
"char_length": 803,
"primary_format": "structured",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": false
},
"content_signals": {
"has_named_people": false,
"has_institutional_language": false,
"has_technical_terminology": true,
"has_first_person": false,
"has_quotations": false
},
"domain_class": "technical",
"one_sentence_summary": "This document provides instructions for reducing the number of printing and prototyping failures by Joran Booth for each category of a part to be printed"
}
},
{
"name": "Kim Kedem Ind Study F2025 Syllabus.docx",
"bucket": "document",
"taxfree_metadata": {
"active_frames": [
"Education",
"Project",
"Software Development",
"3D Printing"
],
"frame_relationships": "The Education frame serves as the context for the Project and Software Development frames, with the 3D Printing frame acting as a specific application of these skills.",
"extraction_orientation": "A knowledge graph extractor should focus on relationships between educational concepts, project goals, software development requirements, and 3D printing techniques.",
"one_sentence_summary": "This independent study outlines a project for the design and implementation of a custom 3D printing slicer in Rhino Grasshopper environment."
},
"standard_metadata": {
"language": "en",
"char_length": 1857,
"primary_format": "prose",
"structural_signals": {
"has_headings": true,
"has_bullet_lists": false,
"has_numbered_lists": false,
"has_tables": false,
"has_code_blocks": false,
"has_dates": true
},
"content_signals": {
"has_named_people": true,
"has_institutional_language": true,
"has_technical_terminology": true,
"has_first_person": false,
"has_quotations": false
},
"domain_class": "educational",
"one_sentence_summary": "This document outlines an independent study focused on designing and implementing a custom 3D printing slicer in the Rhino Grasshopper environment."
}
},
{
"name": "Aaron Nelson Graduate Transcript.pdf",
"bucket": "document",
"taxfree_metadata": {},
"standard_metadata": {
"Name": "Aaron Nelson",
"Student ID": "00917133",
"University": "University of Massachusetts Dartmouth",
"Address": "285 Old Westport Road N Dartmouth, MA 027472356",
"Degree Awarded": "Master of Fine Arts",
"Confer Date": "05/23/2010",
"Degree GPA": "3.885",
"Program of Study": {
"Artisanry - Jewelry/Metals": [
{
"Course": "Graduate Seminar I",
"Grade": "B",
"Credits": "3.00",
"Points": "9.000"
},
{
"Course": "Instructional Development",
"Grade": "B+",
"Credits": "3.00",
"Points": "9.900"
},
{
"Course": "Graduate Seminar II",
"Grade": "A-",
"Credits": "3.00",
"Points": "11.100"
},
{
"Course": "Graduate Standard I: Metals/Jewelry",
"Grade": "A",
"Credits": "9.00",
"Points": "36.000"
},
{
"Course": "Methods & Theory in Art History",
"Grade": "A",
"Credits": "3.00",
"Points": "12.000"
},
{
"Course": "Graduate Standard II: Metals/Jewelry",
"Grade": null,
"Credits": "9.00",
"Points": null
},
{
"Course": "Visual Thesis",
"Grade": null,
"Credits": "6.00",
"Points": null
},
{
"Course": "Written Thesis",
"Grade": null,
"Credits": "3.00",
"Points": null
},
{
"Course": "Independent Study (Arduino Microcontroller Basics)",
"Grade": "A",
"Credits": "6.00",
"Points": "24.000"
},
{
"Course": "Independent Study (Furniture Failing)",
"Grade": "A",
"Credits": "3.00",
"Points": "12.000"
},
{
"Course": "Visual Thesis (Continuation)",
"Grade": null,
"Credits": "6.00",
"Points": null
},
{
"Course": "Writing Seminar",
"Grade": "A-",
"Credits": "3.00",
"Points": "11.100"
},
{
"Course": "Thesis Report (Continuation)",
"Grade": null,
"Credits": "3.00",
"Points": null
},
{
"Course": "Transcript Note: Lessons in Friction and Torque or: How I learned to Stop Worrying and Love the Information Age (Continuation)",
"Grade": null,
"Credits": null,
"Points": null
}
]
},
"Non Credit Courses": [
{
"Course": "Metals Open Studio",
"Credits": null,
"Points": null
}
]
}
}
]
}