---
# Spec "Gutenberg spec claude", attached to the dataset named "Gutenberg".
spec:
  # IDs are quoted so they are always loaded as strings.
  id: '449e018e-a624-460b-b00c-2d1b7ccf800f'
  name: Gutenberg spec claude
  description: ''
  datasetId: 'a526fbae-80e5-4459-b4fb-75e4eb9b15e0'
  datasetName: Gutenberg
  # Folded block scalar (">-"): the lines below are joined with single
  # spaces into one string and the trailing newline is stripped.
  requirements: >-
    The data point must be a complete classic novel or book text in plain text
    format. It must begin with the book's title and author name. It must
    include a 'Contents' section that lists all chapters. The text must be
    divided into multiple numbered chapters, each with its own title. Each
    chapter must contain the full chapter text. The book must be a work of
    fiction resembling those from the Project Gutenberg collection. The text
    must end with Project Gutenberg end-of-book notices including copyright and
    distribution information.
  # Quoted so the version stays a string rather than the integer 3.
  spec_version: '3'
  # One list entry per data property. Every entry carries property_name,
  # property_values, base_distributions and conditional_distributions.
  data_property_variations:
    # Property "Author name": 15 candidate authors.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). Its keys are listed alphabetically,
    # while property_values uses a different order.
    - base_distributions:
        Arthur Conan Doyle: 7
        Bram Stoker: 6
        Charles Dickens: 7
        Edgar Allan Poe: 6
        H. G. Wells: 10
        Herman Melville: 5
        Jack London: 10
        Jane Austen: 5
        Joseph Conrad: 4
        Jules Verne: 8
        Mark Twain: 8
        Mary Shelley: 6
        Oscar Wilde: 6
        Robert Louis Stevenson: 7
        Rudyard Kipling: 5
      # Empty mapping: no conditional distributions are defined here.
      conditional_distributions: {}
      property_name: Author name
      property_values:
        - Jack London
        - H. G. Wells
        - Mark Twain
        - Jules Verne
        - Robert Louis Stevenson
        - Arthur Conan Doyle
        - Edgar Allan Poe
        - Mary Shelley
        - Bram Stoker
        - Oscar Wilde
        - Charles Dickens
        - Jane Austen
        - Herman Melville
        - Rudyard Kipling
        - Joseph Conrad
    # Property "Book title": 15 candidate titles.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer).
    # NOTE(review): conditional_distributions is empty, so nothing in this
    # entry ties a title to the "Author name" property. If the two are
    # sampled independently, a title can be paired with an author who did not
    # write it; the author list also contains Jane Austen, Herman Melville,
    # Edgar Allan Poe and Arthur Conan Doyle, who wrote none of these titles.
    # Confirm whether a conditional distribution is intended.
    - base_distributions:
        A Tale of Two Cities: 7
        Adventures of Huckleberry Finn: 7
        Dracula: 7
        Frankenstein: 7
        Heart of Darkness: 6
        The Call of the Wild: 7
        The Invisible Man: 6
        The Jungle Book: 6
        The Picture of Dorian Gray: 6
        The Strange Case of Dr. Jekyll and Mr. Hyde: 6
        The Time Machine: 7
        The War of the Worlds: 7
        Treasure Island: 7
        Twenty Thousand Leagues Under the Sea: 7
        White Fang: 7
      conditional_distributions: {}
      property_name: Book title
      property_values:
        - The Call of the Wild
        - The Time Machine
        - White Fang
        - The War of the Worlds
        - The Invisible Man
        - Adventures of Huckleberry Finn
        - Twenty Thousand Leagues Under the Sea
        - Treasure Island
        - The Strange Case of Dr. Jekyll and Mr. Hyde
        - Dracula
        - Frankenstein
        - The Picture of Dorian Gray
        - Heart of Darkness
        - The Jungle Book
        - A Tale of Two Cities
    # Property "Number of chapters": 10 candidate chapter counts (5 to 30).
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer).
    # The keys are strings and are listed in lexicographic order, which is
    # why "5 chapters" and "7 chapters" follow "30 chapters"; property_values
    # lists the same values in ascending numeric order.
    - base_distributions:
        10 chapters: 15
        12 chapters: 15
        15 chapters: 12
        16 chapters: 10
        20 chapters: 10
        24 chapters: 8
        28 chapters: 6
        30 chapters: 4
        5 chapters: 8
        7 chapters: 12
      conditional_distributions: {}
      property_name: Number of chapters
      property_values:
        - 5 chapters
        - 7 chapters
        - 10 chapters
        - 12 chapters
        - 15 chapters
        - 16 chapters
        - 20 chapters
        - 24 chapters
        - 28 chapters
        - 30 chapters
    # Property "Chapter numbering format": 5 chapter-heading styles.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    # The spelled-out-ordinal value uses ordinal words in its example so that
    # it cannot be confused with "Roman numerals with 'Chapter' prefix and
    # period". The same string must appear in both base_distributions and
    # property_values.
    - base_distributions:
        Arabic numerals with 'Chapter' prefix: 20
        Mixed format with both numbers and descriptive titles: 15
        Roman numerals (I, II, III, etc.): 25
        Roman numerals with 'Chapter' prefix and period: 15
        Spelled out ordinal numbers (Chapter the First, Chapter the Second, etc.): 25
      conditional_distributions: {}
      property_name: Chapter numbering format
      property_values:
        - Roman numerals (I, II, III, etc.)
        - Spelled out ordinal numbers (Chapter the First, Chapter the Second, etc.)
        - Arabic numerals with 'Chapter' prefix
        - Roman numerals with 'Chapter' prefix and period
        - Mixed format with both numbers and descriptive titles
    # Property "Primary narrative perspective": 6 candidate points of view.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Epistolary (letters/diary entries): 4
        First person frame narrative with embedded story: 20
        First person narrator recounting events: 25
        Multiple first-person narrators: 6
        Third person limited: 15
        Third person omniscient following a single protagonist: 30
      conditional_distributions: {}
      property_name: Primary narrative perspective
      property_values:
        - Third person omniscient following a single protagonist
        - First person narrator recounting events
        - First person frame narrative with embedded story
        - Third person limited
        - Multiple first-person narrators
        - Epistolary (letters/diary entries)
    # Property "Literary genre/category": 12 candidate genres.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Adventure novel: 15
        Dystopian fiction: 7
        Gothic horror: 10
        Historical fiction: 10
        Mystery/Detective fiction: 10
        Philosophical fiction: 3
        Romantic adventure: 5
        Science fiction: 12
        Sea adventure: 8
        Social commentary fiction: 5
        Supernatural thriller: 7
        Wilderness survival: 8
      conditional_distributions: {}
      property_name: Literary genre/category
      property_values:
        - Adventure novel
        - Science fiction
        - Gothic horror
        - Mystery/Detective fiction
        - Historical fiction
        - Sea adventure
        - Wilderness survival
        - Dystopian fiction
        - Supernatural thriller
        - Romantic adventure
        - Social commentary fiction
        - Philosophical fiction
    # Property "Protagonist type": 8 candidate protagonist categories.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Adult male professional (doctor, detective, etc.): 18
        Animal protagonist with anthropomorphized thoughts: 10
        Child or adolescent protagonist: 10
        Ensemble cast with no single protagonist: 7
        Female protagonist: 12
        Male human scientist or explorer: 20
        Supernatural or non-human entity: 5
        Young male adventurer: 18
      conditional_distributions: {}
      property_name: Protagonist type
      property_values:
        - Animal protagonist with anthropomorphized thoughts
        - Male human scientist or explorer
        - Young male adventurer
        - Adult male professional (doctor, detective, etc.)
        - Female protagonist
        - Child or adolescent protagonist
        - Ensemble cast with no single protagonist
        - Supernatural or non-human entity
    # Property "Primary setting time period": 9 candidate eras.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    # NOTE(review): "Victorian era (1830s-1880s)" and "Late 19th century
    # contemporary (1880s-1900)" both include the 1880s, so the two labels
    # overlap; confirm whether the ranges are meant to be disjoint.
    - base_distributions:
        18th century historical: 10
        American frontier/Wild West era: 8
        Distant future: 15
        Late 19th century contemporary (1880s-1900): 25
        Medieval or ancient past: 8
        Near future or speculative present: 15
        Prehistoric or primordial times: 4
        Timeless/mythological setting: 3
        Victorian era (1830s-1880s): 12
      conditional_distributions: {}
      property_name: Primary setting time period
      property_values:
        - Late 19th century contemporary (1880s-1900)
        - Near future or speculative present
        - Distant future
        - 18th century historical
        - Medieval or ancient past
        - Victorian era (1830s-1880s)
        - American frontier/Wild West era
        - Prehistoric or primordial times
        - Timeless/mythological setting
    # Property "Primary setting location type": 10 candidate location types.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Arctic or polar region: 8
        Isolated estate or mansion: 10
        Multiple varied locations: 10
        Remote island: 8
        Sea/ocean voyage: 12
        Small village or countryside: 9
        Tropical or exotic locale: 8
        Underground/subterranean location: 5
        Urban Victorian setting (London, Paris, etc.): 15
        Wilderness/frontier (forests, tundra, etc.): 15
      conditional_distributions: {}
      property_name: Primary setting location type
      property_values:
        - Wilderness/frontier (forests, tundra, etc.)
        - Urban Victorian setting (London, Paris, etc.)
        - Sea/ocean voyage
        - Isolated estate or mansion
        - Remote island
        - Underground/subterranean location
        - Arctic or polar region
        - Tropical or exotic locale
        - Small village or countryside
        - Multiple varied locations
    # Property "Presence of epilogue": two-valued flag expressed as strings.
    # The base_distributions values sum to 100 (25 with, 75 without);
    # presumably sampling weights, TODO confirm with the consumer.
    - base_distributions:
        Has epilogue: 25
        No epilogue: 75
      conditional_distributions: {}
      property_name: Presence of epilogue
      property_values:
        - Has epilogue
        - No epilogue
    # Property "Presence of prologue or introduction chapter": two-valued
    # flag expressed as strings.
    # The base_distributions values sum to 100 (30 with, 70 without);
    # presumably sampling weights, TODO confirm with the consumer.
    - base_distributions:
        Has prologue or introduction: 30
        No prologue or introduction: 70
      conditional_distributions: {}
      property_name: Presence of prologue or introduction chapter
      property_values:
        - Has prologue or introduction
        - No prologue or introduction
    # Property "Chapter title style": 7 candidate styles for chapter titles.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    # NOTE(review): the spec's requirements text says chapters are "each with
    # its own title", but "Numbered only without descriptive titles" (10) and
    # "Mixed style with some chapters having titles and others not" (5)
    # describe chapters without titles. Confirm which side should change.
    - base_distributions:
        Character name titles: 10
        Descriptive phrase titles (e.g., 'Into the Primitive', 'The Law of Club and Fang'): 40
        Location-based titles: 10
        Mixed style with some chapters having titles and others not: 5
        Numbered only without descriptive titles: 10
        Question-based titles: 10
        Single word titles: 15
      conditional_distributions: {}
      property_name: Chapter title style
      property_values:
        - Descriptive phrase titles (e.g., 'Into the Primitive', 'The Law of Club and Fang')
        - Question-based titles
        - Single word titles
        - Character name titles
        - Location-based titles
        - Numbered only without descriptive titles
        - Mixed style with some chapters having titles and others not
    # Property "Approximate total word count": 5 length bands, from
    # 30,000-50,000 words up to 150,000+ words.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer).
    # The keys are strings in lexicographic order, so the "100,000-..." and
    # "150,000+" bands are listed before "30,000-..."; property_values lists
    # the bands in ascending size.
    # NOTE(review): with conditional_distributions empty, nothing here links
    # length to "Number of chapters", so extreme pairings such as
    # "5 chapters" with "150,000+ words" look possible; confirm.
    - base_distributions:
        100,000-150,000 words (long novel): 10
        150,000+ words (epic novel): 5
        30,000-50,000 words (novella): 20
        50,000-70,000 words (short novel): 35
        70,000-100,000 words (standard novel): 30
      conditional_distributions: {}
      property_name: Approximate total word count
      property_values:
        - 30,000-50,000 words (novella)
        - 50,000-70,000 words (short novel)
        - 70,000-100,000 words (standard novel)
        - 100,000-150,000 words (long novel)
        - 150,000+ words (epic novel)
    # Property "Central themes": 12 candidate themes.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Class struggle and social inequality: 8
        Good vs. evil moral conflict: 10
        Identity and transformation: 10
        Imperialism and colonialism: 5
        Isolation and human connection: 7
        Love and sacrifice: 7
        Mortality and immortality: 3
        Nature vs. civilization conflict: 10
        Revenge and justice: 8
        Scientific discovery and its consequences: 10
        Survival and adaptation to harsh environments: 12
        Time, progress, and evolution: 10
      conditional_distributions: {}
      property_name: Central themes
      property_values:
        - Survival and adaptation to harsh environments
        - Nature vs. civilization conflict
        - Time, progress, and evolution
        - Scientific discovery and its consequences
        - Good vs. evil moral conflict
        - Class struggle and social inequality
        - Identity and transformation
        - Revenge and justice
        - Love and sacrifice
        - Isolation and human connection
        - Imperialism and colonialism
        - Mortality and immortality
    # Property "Narrative pacing style": 5 candidate pacing styles.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Episodic structure with varying pace: 15
        Fast-paced action-driven narrative: 25
        Gradually escalating tension throughout: 10
        Moderate pace with balanced action and reflection: 35
        Slower contemplative pace with philosophical digressions: 15
      conditional_distributions: {}
      property_name: Narrative pacing style
      property_values:
        - Fast-paced action-driven narrative
        - Moderate pace with balanced action and reflection
        - Slower contemplative pace with philosophical digressions
        - Episodic structure with varying pace
        - Gradually escalating tension throughout
    # Property "Use of dialogue": 5 candidate dialogue styles.
    # The base_distributions values sum to 100 (presumably sampling weights;
    # TODO confirm with the consumer). No conditional distributions.
    - base_distributions:
        Dialect or vernacular speech heavily featured: 10
        Frame narrative with dialogue in outer story only: 10
        Heavy use of dialogue throughout: 20
        Minimal dialogue, mostly narrative: 20
        Moderate dialogue mixed with narrative description: 40
      conditional_distributions: {}
      property_name: Use of dialogue
      property_values:
        - Heavy use of dialogue throughout
        - Moderate dialogue mixed with narrative description
        - Minimal dialogue, mostly narrative
        - Frame narrative with dialogue in outer story only
        - Dialect or vernacular speech heavily featured
  # No SQL schema column is selected (explicit null) and the list of SQL
  # query columns is empty.
  selected_sql_schema_column: null
  selected_sql_query_columns: []
  # Dates are quoted so they load as strings rather than as YAML timestamps.
  createdAt: '2026-01-08'
  updatedAt: '2026-01-09'
