• Jump To … +
    abbreviations.js adjectives.js convertables.js dates.js demonyms.js firstnames.js honourifics.js irregular_nouns.js irregular_verbs.js misc.js multiples.js numbers.js organisations.js phrasal_verbs.js places.js uncountables.js verbs.js fns.js index.js lexicon.js negate.js passive_voice.js contractions.js fancy_lumping.js grammar_rules.js parts_of_speech.js phrasal_verbs.js tagger.js word_rules.js question.js sentence.js statement.js tense.js adjective.js to_adverb.js to_comparative.js to_noun.js to_superlative.js adverb.js to_adjective.js is_acronym.js article.js date.js date_rules.js is_date.js parse_date.js is_plural.js is_uncountable.js noun.js is_organisation.js organisation.js gender.js is_person.js parse_name.js person.js is_place.js place.js pluralize.js pronoun.js singularize.js is_value.js numbers.js to_number.js units.js value.js term.js conjugate.js from_infinitive.js predict_form.js suffix_rules.js to_actor.js to_infinitive.js negate.js verb.js sentence_parser.js text.js
  • abbreviations.js

  • ¶

    these are common word shortenings used in the lexicon and sentence-segmentation methods. these are all nouns or, at the least, belong beside one.

    'use strict';
    const honourifics = require('./honourifics'); //stored seperately, for 'noun.is_person()'
  • ¶

    common abbreviations

    // Seed list of general shortenings. Declared with `let` because the
    // statements further down rebind it as the other lists are appended.
    let main = [
      'arc', 'al', 'exp', 'rd', 'st', 'dist',
      'mt', 'fy', 'pd', 'pl', 'plz', 'tce',
      'llb', 'md', 'bl', 'ma', 'ba', 'lit',
      'ex', 'eg', 'ie', 'circa', 'ca', 'cca',
      'vs', 'etc', 'esp', 'ft', 'bc', 'ad'
    ];
  • ¶

    person titles like ‘jr’ (stored separately)

    // Append the honourifics list (loaded from ./honourifics) to the running list.
    main = [].concat(main, honourifics);
  • ¶

    organisation abbreviations

    // Shortenings that accompany organisation names, followed by proper nouns
    // that are written with an exclamation mark. Exported on its own as `orgs`.
    const orgs = [
      'dept', 'univ', 'assn', 'bros', 'inc', 'ltd', 'co', 'corp',
      //proper nouns with exclamation marks
      'yahoo', 'joomla', 'jeopardy'
    ];
    // Fold the organisation entries into the running list.
    main = [].concat(main, orgs);
  • ¶

    place abbreviations

    // Place-related shortenings, exported on its own as `places`.
    // NOTE(review): the first row looks like US state shortenings and the third
    // like Canadian provinces; confirm before relying on that grouping.
    // 'la' used to appear twice (once out of order after 'ia'); only the copy
    // after 'ky' is kept so every entry is unique.
    const places = [
      'ala', 'ariz', 'ark', 'cal', 'calif', 'col', 'colo', 'conn', 'del', 'fed', 'fla', 'fl', 'ga', 'ida', 'ind', 'ia', 'kan', 'kans', 'ken', 'ky', 'la', 'md', 'mich', 'minn', 'mont', 'neb', 'nebr', 'nev', 'okla', 'penna', 'penn', 'pa', 'dak', 'tenn', 'tex', 'ut', 'vt', 'va', 'wash', 'wis', 'wisc', 'wy', 'wyo',
      'usafa',
      'alta', 'ont', 'que', 'sask', 'yuk',
      'ave', 'blvd', 'cl', 'ct', 'cres', 'hwy'
    ];
    // Fold the place entries into the running list.
    main = [].concat(main, places);
  • ¶

    date abbreviations. these are added separately because they are not nouns

    // Month shortenings, exported on its own as `dates`. 'sep' was listed twice;
    // the trailing duplicate is dropped. 'may' is absent from the list,
    // presumably because it is already a full word.
    const dates = ['jan', 'feb', 'mar', 'apr', 'jun', 'jul', 'aug', 'sep', 'oct', 'nov', 'dec', 'sept'];
    main = main.concat(dates);
    
    module.exports = {
      abbreviations: main,
      dates: dates,
      orgs: orgs,
      places: places
    };