# The London Perl and Raku Workshop takes place on 26th Oct 2024. If your company depends on Perl, please consider sponsoring and/or attending.
# Copyright (C) 2004 Jörg Tiedemann  <joerg@stp.ling.uu.se>
# Default settings, written as a single anonymous Perl hash:
#   'encoding' - character encoding name for this file's settings
#   'default'  - stop-word classes, named character sets, and phrase filters
{
  'encoding' => 'iso-8859-1',
  'default' => {
    # No stop-word classes are defined by default.
    'stop words' => {
      'classes' => [
      ],
    },
    # Named character sets.  Each value is a string of literal characters,
    # ranges (A-Z, a-z, 0-9) and backslash-escaped symbols; presumably it is
    # placed inside a regex bracket class by the consumer -- TODO confirm.
    'character specifications' => {
      'upper case letter' => 'A-ZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝ',
      'lower case letter' => 'a-zàáâãäåæçèéêëìíîïðñòóôõöøùúûüý',
      # The set contains a trailing space in addition to the hyphen.
      'hyphen' => '\- ',
      'punctuation' => '\.\!\?\¿\,\:\;',
      'digit' => '0-9',
      # The key spelling 'parantheses' is kept as-is: the key
      # 'parantheses' is also named in 'skip phrase at string type' below.
      'closing parantheses' => '\)\]\}',
      'opening parantheses' => '\(\[\{',
      # 'numeric' is '0-9' followed by the 'numeric symbol' set; both end
      # with a space character.
      'numeric symbol' => '\.\,E\^\%\+\-\<\>\*\=\/\(\)\[\]\{\}\±\¹\²\³\÷\:\¼\½\¾ ',
      'numeric' => '0-9\.\,E\^\%\+\-\<\>\*\=\/\(\)\[\]\{\}\±\¹\²\³\÷\:\¼\½\¾ ',
      # Closing brackets followed by opening brackets.
      'parantheses' => '\)\]\}\(\[\{',
      # Ý/ý are listed here as vowels while plain Y/y are listed under
      # 'consonant'.
      'vowel' => 'AEIOUÀÁÂÃÄÅÆÈÉÊËÌÍÎÏÒÓÔÕÖØÙÚÛÜÝaeiouàáâãäåæèéêëìíîïòóôõöøùúûüý',
      # Punctuation, backslash, both quote characters, all brackets, '|', '/'.
      'token delimiter' => '\.\!\?\¿\,\:\;\\\'\"\(\[\{\)\]\}\|\/',
      # NOTE(review): þ is listed here and not in any letter set -- confirm
      # that this is intended.
      'special symbol' => '\#\$\%\&\@\^\`\~\¡\¢\£\¤\¥\¦\§\¨\©\ª\«\¬\®\°\´\µ\¶\¸\º\»\þ',
      'sentence delimiter' => '\.\!\?\¿',
      # Lower-case ñ is included so that the lower-case half mirrors the
      # upper-case half (Ç Ð Ñ / ç ð ñ); without it ñ is a 'letter' that is
      # neither a 'vowel' nor a 'consonant'.
      'consonant' => 'BCDFGHJKLMNPQRSTVWXYZÇÐÑbcdfghjklmnpqrstvwxyzçðñ',
      # Concatenation of the upper-case and lower-case letter sets.
      'letter' => 'A-ZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝa-zàáâãäåæçèéêëìíîïðñòóôõöøùúûüý',
      # Single quote followed by double quote.
      'quotation' => "'".'"',
      'special alphanumeric symbol' => '\_'
    },
    # Phrase filters.  All lists except the first two are empty by default.
    'phrases' => {
      # Each entry is the name of a set in 'character specifications'.
      'skip phrase at string type' => [
        'numeric',
        'punctuation',
        'parantheses',
        'special symbol',
      ],
      # Literal tokens; "\\" is a single backslash.
      'skip token' => [
        ',','.',';',':','-','/','(','[','{',')',']','}',"\\",
        '!','?','+','*','#','"',"'",'...','--'
      ],
      'skip phrase after' => [
      ],
      'skip phrase at' => [
      ],
      'skip phrase before' => [
      ],
      'non-phrase-starter' => [
      ],
      'non-phrase-ender' => [
      ],
    },
  }
}