# EMPH YAML source

# Feature identity. The *_number / *_code keys look like this feature's
# identifiers in other tagging schemes (compare the keys under `sources`)
# — TODO confirm.
code: EMPH
biber_number: K49
mfte_code: EMPH
bohmann_number: 87
name: Emphatics
# Informal summary only; the actual matching rules live under `detection`.
definition: >-
  General emphatic markers: just, really, so + adjective, do + verb (emphatic do),
  etc.
# NOTE(review): presumably the unit that counts are normalized by — confirm
# against the consumer.
normalization: words
# List of alternative detection rules. Each rule names the token attributes it
# needs (`requires`), a set of named CQL queries (`parts`), and how to join
# them (`combine`).
detection:
# Rule without a `source` key; its description calls it the default rule,
# based on MFTE. Its eight parts are the same queries as the `source: mfte`
# rule further down.
- requires:
  - word
  - pos
  parts:
    # "most" carrying the DT tag (single-token match, no right context).
    p1:
      cql: '[word="most" & pos="DT"]'
    # "most" followed by a token tagged JJ.*, VBN or VBG.
    p2:
      cql: '[word="most"] [pos="JJ.*|VBN|VBG"]'
    # real/dead/damn/super followed by a JJ.* or RB.* token.
    p3:
      cql: '[word="real|dead|damn|super"] [pos="JJ.*|RB.*"]'
    # really/truly/bloody/pretty/more followed by a JJ.*, RB.*, VB.* or MD
    # token.
    p4:
      cql: '[word="really|truly|bloody|pretty|more"] [pos="JJ.*|RB.*|VB.*|MD"]'
    # "so" followed by a JJ.* or RB.* token.
    p5:
      cql: '[word="so"] [pos="JJ.*|RB.*"]'
    # far/way, when not tagged NN.*, followed by a JJ.* or RB.* token.
    p6:
      cql: '[word="far|way" & pos!="NN.*"] [pos="JJ.*|RB.*"]'
    # "such" followed by "a" or "an".
    p7:
      cql: '[word="such"] [word="a|an"]'
    # do/does/did tagged VB.*, followed by a token tagged VB (no wildcard).
    # NOTE(review): this is the only part that spells out both capitalizations
    # ([Dd]); whether the lowercase-only parts above also match
    # sentence-initial forms depends on the query engine's case handling —
    # confirm.
    p8:
      cql: '[word="[Dd]o|[Dd]oes|[Dd]id" & pos="VB.*"] [pos="VB"]'
  # A hit on any single part counts.
  combine: "p1 | p2 | p3 | p4 | p5 | p6 | p7 | p8"
  # NOTE(review): several parts match tokens that are not RB-tagged (p1 needs
  # DT, p8 needs VB.*); confirm how `refines: RB` interacts with those.
  refines: RB
  description: >-
    Default emphatics rule (based on MFTE): context-dependent patterns.
    Refines RB for tag refinement architecture.
# Rule attributed to pybiber: bare word matches plus a few two-token patterns.
- source: pybiber
  requires:
  - word
  - pos
  parts:
    # just/really/most/more in any context (no POS constraint).
    p1:
      cql: '[word="just|really|most|more"]'
    # "so" followed by a JJ.* token.
    p2:
      cql: '[word="so"] [pos="JJ.*"]'
    # "real" followed by a JJ.* token.
    p3:
      cql: '[word="real"] [pos="JJ.*"]'
    # "such a".
    # NOTE(review): only "a" is matched here, whereas the other two rules in
    # this file use "a|an" — presumably mirrors pybiber; confirm.
    p4:
      cql: '[word="such"] [word="a"]'
    # "a lot".
    p5:
      cql: '[word="a"] [word="lot"]'
    # "for sure".
    p6:
      cql: '[word="for"] [word="sure"]'
    # do/does/did/doing tagged VB.*, followed by any VB.* token. Broader than
    # the p8 of the other two rules, which omit "doing" and require a plain VB
    # tag on the second token.
    p7:
      cql: '[word="do|does|did|doing" & pos="VB.*"] [pos="VB.*"]'
  # A hit on any single part counts.
  combine: "p1 | p2 | p3 | p4 | p5 | p6 | p7"
  description: >-
    pybiber's emphatic patterns: simple words (no POS filter),
    so/real + adjective, multi-word expressions, emphatic do + verb.
# Rule attributed to MFTE. Its parts are the same eight queries as the default
# (source-less) rule at the top of `detection`.
- source: mfte
  requires:
  - word
  - pos
  parts:
    # "most" carrying the DT tag (single-token match, no right context).
    p1:
      cql: '[word="most" & pos="DT"]'
    # "most" followed by a token tagged JJ.*, VBN or VBG.
    p2:
      cql: '[word="most"] [pos="JJ.*|VBN|VBG"]'
    # real/dead/damn/super followed by a JJ.* or RB.* token.
    p3:
      cql: '[word="real|dead|damn|super"] [pos="JJ.*|RB.*"]'
    # really/truly/bloody/pretty/more followed by a JJ.*, RB.*, VB.* or MD
    # token.
    p4:
      cql: '[word="really|truly|bloody|pretty|more"] [pos="JJ.*|RB.*|VB.*|MD"]'
    # "so" followed by a JJ.* or RB.* token.
    p5:
      cql: '[word="so"] [pos="JJ.*|RB.*"]'
    # far/way, when not tagged NN.*, followed by a JJ.* or RB.* token.
    # NOTE(review): the description excludes "so/thus far", but this query
    # does not inspect the preceding token — confirm the exclusion is applied
    # elsewhere.
    p6:
      cql: '[word="far|way" & pos!="NN.*"] [pos="JJ.*|RB.*"]'
    # "such" followed by "a" or "an".
    p7:
      cql: '[word="such"] [word="a|an"]'
    # do/does/did tagged VB.*, followed by a token tagged VB (no wildcard).
    # NOTE(review): the description says emphatic do is counted separately via
    # the DOAUX tag, yet this part is still included in `combine` — confirm
    # which is intended.
    p8:
      cql: '[word="[Dd]o|[Dd]oes|[Dd]id" & pos="VB.*"] [pos="VB"]'
  # A hit on any single part counts.
  combine: "p1 | p2 | p3 | p4 | p5 | p6 | p7 | p8"
  refines: RB
  # Wording below is aligned with the queries above (p1/p2 for "most", MD in
  # p4, RB.* in p5).
  description: >-
    MFTE emphatics: all context-dependent. Most as determiner (DT) or
    before adjective/participle (JJ, VBN, VBG). Real/dead/damn/super
    before adjective or adverb. Really/truly/bloody/pretty/more before
    adj/adv/verb/modal. So before adjective or adverb. Far/way before
    adj/adv (not "so/thus far", not "away"). Such before a/an. Emphatic
    do counted separately via DOAUX tag.
# Reference keys for the works behind this feature definition.
# NOTE(review): the entries under `examples` cite `le_foll_2024`, which is not
# listed here — confirm whether example sources are meant to be tracked
# separately.
sources:
- biber_1988
- mfte
- pybiber
- grieve_2023
- bohmann_2019
# Illustrative sentences; the underscores appear to mark the emphatic tokens.
# NOTE(review): "just" is matched only by the pybiber rule's p1, and "really"
# directly before "?" has no adjective/adverb/verb/modal to its right as the
# default rule's p4 requires — confirm the examples are meant to illustrate
# the feature in general rather than the default rule specifically.
examples:
- text: I _do_ wish I hadn't drunk quite _so_ much.
  source: le_foll_2024
- text: Oh _really_?
  source: le_foll_2024
- text: I _just_ can't get my head around it.
  source: le_foll_2024