class Object

Public Instance Methods

both_classifications() click to toggle source
# File lib/definitions/classifications.rb, line 10
# Returns the combined list of classification names: everything from
# +classifications+ followed by everything from +non_regex_classifications+.
# The concatenated array is cached in @both_classifications after the first call.
#
# @return [Array<String>]
def both_classifications
  @both_classifications ||= begin
    regex_backed = classifications
    regex_backed + non_regex_classifications
  end
end
both_classifications_symboled() click to toggle source
# File lib/definitions/classifications.rb, line 14
# Returns every name from +both_classifications+ converted to a Symbol.
#
# The result is cached in @both_classifications_symboled. The previous
# version assigned to a *local* variable of the same name, so nothing was
# ever memoized and the list was rebuilt on every call.
#
# @return [Array<Symbol>]
def both_classifications_symboled
  @both_classifications_symboled ||= both_classifications.map(&:to_sym)
end
classifications() click to toggle source
# File lib/definitions/classifications.rb, line 2
# Returns the list of classification names, cached in @classifications.
#
# @return [Array<String>]
def classifications
  @classifications ||= %w[
    name phone email address section
    professions companies schools dates cities
  ]
end
header_classifications() click to toggle source
# File lib/definitions/classifications.rb, line 18
# Returns the list of header classification names, cached in
# @header_classifications.
#
# @return [Array<String>]
def header_classifications
  @header_classifications ||= %w[professions companies schools dates cities]
end
non_regex_classifications() click to toggle source
# File lib/definitions/classifications.rb, line 6
# Returns the list of non-regex classification names.
#
# The result is cached in @non_regex_classifications. The previous version
# assigned to a *local* variable of the same name, so a new array was
# allocated on every call instead of being memoized like the sibling lists.
#
# @return [Array<String>]
def non_regex_classifications
  @non_regex_classifications ||= %w[number_of_words many_words verbs text type id presume]
end
regex_address() click to toggle source
# File lib/definitions/regex.rb, line 17
# Returns the memoized, case-insensitive street-address pattern: a digit, a
# space, one or two space-terminated words of at least two word characters,
# one of the listed street suffixes / abbreviations, and finally a word
# boundary (optionally preceded by a period).
#
# @return [Regexp]
def regex_address
  @regex_address ||= begin
    street_suffixes = "Alley|ALY|Annex|ANX|Arcade|ARC|Avenue|AVE|Bayou|YU|Beach|BCH|Bend|BND|Bluff|BLF|Bottom|BTM|Boulevard|BLVD|Branch|BR|Bridge|BRG|Brook|BRK|Burg|BG|Bypass|BYP|Camp|CP|Canyon|CYN|Cape|CPE|Causeway|CSWY|Center|CTR|Circle|CIR|Cliffs|CLFS|Club|CLB|Corner|COR|Corners|CORS|Course|CRSE|Court|CT|Courts|CTS|Cove|CV|Creek|CRK|Crescent|CRES|Crossing|XING|Dale|DL|Dam|DM|Divide|DV|Drive|DR|Estates|EST|Expressway|EXPY|Extension|EXT|Fall|FALL|Falls|FLS|Ferry|FRY|Field|FLD|Fields|FLDS|Flats|FLT|Ford|FOR|Forest|FRST|Forge|FGR|Fork|FORK|Forks|FRKS|Fort|FT|Freeway|FWY|Gardens|GDNS|Gateway|GTWY|Glen|GLN|Green|GN|Grove|GRV|Harbor|HBR|Haven|HVN|Heights|HTS|Highway|HWY|Hill|HL|Hills|HLS|Hollow|HOLW|Inlet|INLT|Island|IS|Islands|ISS|Isle|ISLE|Junction|JCT|Key|CY|Knolls|KNLS|Lake|LK|Lakes|LKS|Landing|LNDG|Lane|LN|Light|LGT|Loaf|LF|Locks|LCKS|Lodge|LDG|Loop|LOOP|Mall|MALL|Manor|MNR|Meadows|MDWS|Mill|ML|Mills|MLS|Mission|MSN|Mount|MT|Mountain|MTN|Neck|NCK|Orchard|ORCH|Oval|OVAL|Park|PARK|Parkway|PKY|Pass|PASS|Path|PATH|Pike|PIKE|Pines|PNES|Place|PL|Plain|PLN|Plains|PLNS|Plaza|PLZ|Point|PT|Port|PRT|Prairie|PR|Radial|RADL|Ranch|RNCH|Rapids|RPDS|Rest|RST|Ridge|RDG|River|RIV|Road|RD|Row|ROW|Run|RUN|Shoal|SHL|Shoals|SHLS|Shore|SHR|Shores|SHRS|Spring|SPG|Springs|SPGS|Spur|SPUR|Square|SQ|Station|STA|Stravenues|STRA|Stream|STRM|Street|ST|Summit|SMT|Terrace|TER|Trace|TRCE|Track|TRAK|Trail|TRL|Trailer|TRLR|Tunnel|TUNL|Turnpike|TPKE|Union|UN|Valley|VLY|Viaduct|VIA|View|VW|Village|VLG|Ville|VL|Vista|VIS|Walk|WALK|Way|WAY|Wells|WLS"
    Regexp.new("\\d (\\w{2,} ){1,2}(#{street_suffixes})(\\b|\\.\\b)", Regexp::IGNORECASE)
  end
end
regex_characters_and_digits() click to toggle source
# File lib/definitions/regex.rb, line 73
# Returns a pattern matching a single ASCII letter or a single digit.
#
# The Regexp is cached in @regex_characters_and_digits so repeated calls
# reuse one object, consistent with the other regex_* helpers (previously a
# new Regexp was allocated on every call).
#
# @return [Regexp]
def regex_characters_and_digits
  @regex_characters_and_digits ||= Regexp.new(/[A-Za-z]|\d/)
end
regex_cities() click to toggle source
# File lib/definitions/regex.rb, line 1
# Returns the memoized, case-insensitive "City, Region" pattern: one to four
# space-separated words of at least two letters, a comma and a space, then
# one of the listed region names or two-letter codes delimited by word
# boundaries.
#
# @return [Regexp]
def regex_cities
  @regex_cities ||= begin
    regions = "AK|Alaska|AL|Alabama|AR|Arkansas|AZ|Arizona|CA|California|CO|Colorado|CT|Connecticut|DE|Delaware|FL|Florida|GA|Georgia|HI|Hawaii|IA|Iowa|ID|Idaho|IL|Illinois|IN|Indiana|KS|Kansas|KY|Kentucky|LA|Louisiana|MA|Massachusetts|MD|Maryland|ME|Maine|MI|Michigan|MN|Minnesota|MO|Missouri|MS|Mississippi|MT|Montana|NC|North Carolina|ND|North Dakota|NE|Nebraska|NH|New Hampshire|NJ|New Jersey|NM|New Mexico|NV|Nevada|NY|New York|OH|Ohio|OK|Oklahoma|OR|Oregon|PA|Pennsylvania|RI|Rhode Island|SC|South Carolina|SD|South Dakota|TN|Tennessee|TX|Texas|UT|Utah|VA|Virginia|VT|Vermont|WA|Washington|WI|Wisconsin|WV|West Virginia|WY|Wyoming|AB|Alberta|BC|British Columbia|MB|Manitoba|NB|New Brunswick|NL|Newfoundland and Labrador|NS|Nova Scotia|ON|Ontario|PE|Prince Edward Island|QC|Quebec|SK|Saskatchewan"
    Regexp.new("([a-z]{2,} ){0,3}[a-z]{2,}\\, \\b(#{regions})\\b", Regexp::IGNORECASE)
  end
end
regex_companies() click to toggle source
# File lib/definitions/regex.rb, line 13
# Returns the memoized, case-sensitive company-name pattern: zero or more
# capitalized words (optionally joined by "and"), followed by a corporate
# suffix (Inc, Corp, Co, Ltd in the listed casings), a word boundary, and an
# optional trailing period.
#
# @return [Regexp]
def regex_companies
  @regex_companies ||= begin
    capitalized_words = '([A-Z][a-z]* )*'
    suffixes = '(Inc|INC|Corp|CORP|CO|Co|LTD|Ltd)'
    Regexp.new("(#{capitalized_words}and #{capitalized_words}|#{capitalized_words})#{suffixes}\\b(\\.|)")
  end
end
regex_current() click to toggle source
# File lib/definitions/regex.rb, line 77
# Returns the memoized, case-insensitive pattern matching any of the words
# "current", "present" or "today".
#
# @return [Regexp]
def regex_current
  @regex_current ||= Regexp.new(%w[current present today].join("|"), Regexp::IGNORECASE)
end
regex_dates() click to toggle source
# File lib/definitions/regex.rb, line 29
# Returns the memoized union of +regex_dates_1+ and +regex_dates_2+, so a
# match on either pattern counts as a date.
#
# @return [Regexp]
def regex_dates
  @regex_dates ||= begin
    date_patterns = [regex_dates_1, regex_dates_2]
    Regexp.union(date_patterns)
  end
end
regex_dates_1() click to toggle source
# File lib/definitions/regex.rb, line 33
# Returns the memoized, case-insensitive pattern for dates written with a
# month or season name followed by a two- or four-digit number, either as a
# range ("Jan 2010 - Mar 2012", "Fall 09 to present") or as a single point in
# time ("June 2012"). The range end may also be "present", "current" or
# "today"; the separator is an en dash, a hyphen or "to".
#
# @return [Regexp]
def regex_dates_1
  @regex_dates_1 ||= begin
    month_or_season = "January|Jan|March|Mar|May|May|July|Jul|September|Sep|Sept|November|Nov|February|Feb|April|Apr|June|Jun|August|Aug|October|Oct|December|Dec|Winter|Fall|Summer|Spring"
    # One "<name> <number>" point in time; reused for range start, range end and the standalone form.
    point = "(#{month_or_season})( |)(\\d{2}\\b|\\d{4}\\b)"
    range = "#{point}( |)(–|-|to)( |)(#{point}|present|current|today)"
    Regexp.new("(#{range}|#{point})", Regexp::IGNORECASE)
  end
end
regex_dates_2() click to toggle source
# File lib/definitions/regex.rb, line 37
# Returns the memoized, case-insensitive pattern for purely numeric ranges:
# two two-digit numbers ("08-10") or two four-digit numbers ("2008 to 2010"),
# where the end may instead be the word "present". The separator is an en
# dash, a hyphen or "to", optionally surrounded by single spaces.
#
# @return [Regexp]
def regex_dates_2
  @regex_dates_2 ||= begin
    separator = "(| )(–|-|to)(| )"
    two_digit_range = "(\\d{2}\\b)#{separator}(\\d{2}\\b|present\\b)"
    four_digit_range = "(\\d{4}\\b)#{separator}(\\d{4}\\b|present\\b)"
    Regexp.new("(#{two_digit_range}|#{four_digit_range})", Regexp::IGNORECASE)
  end
end
regex_email() click to toggle source
# File lib/definitions/regex.rb, line 25
# Returns the memoized, case-insensitive e-mail pattern: one or more word
# characters, "@", one or more word characters, a literal dot, and one to
# five word characters, delimited by word boundaries.
#
# @return [Regexp]
def regex_email
  @regex_email ||= begin
    pattern = '\b(\w){1,}@(\w){1,}\.(\w){1,5}\b'
    Regexp.new(pattern, Regexp::IGNORECASE)
  end
end
regex_engtagger_verbs() click to toggle source
# File lib/definitions/regex.rb, line 61
# Returns the memoized, case-sensitive pattern matching a "<vb>" tag with an
# optional single lowercase letter after "vb" (e.g. "<vb>", "<vbd>").
#
# @return [Regexp]
def regex_engtagger_verbs
  @regex_engtagger_verbs ||= begin
    pattern = '<vb[a-z]{0,1}>'
    Regexp.new(pattern)
  end
end
regex_month() click to toggle source
# File lib/definitions/regex.rb, line 41
# Returns the memoized, case-insensitive pattern matching any listed month
# name or abbreviation.
#
# @return [Regexp]
def regex_month
  @regex_month ||= begin
    # Order (including the repeated "May") is kept so the pattern source is unchanged.
    names = %w[
      January Jan March Mar May May July Jul September Sep Sept November Nov
      February Feb April Apr June Jun August Aug October Oct December Dec
    ]
    Regexp.new(names.join("|"), Regexp::IGNORECASE)
  end
end
regex_new_lines_and_blanks() click to toggle source
# File lib/definitions/regex.rb, line 57
# Returns the memoized pattern matching a run of one to four newlines or a
# run of exactly three spaces.
#
# Note: the cache lives in @regex_new_lines (not an ivar named after the
# method); that name is kept as-is.
#
# @return [Regexp]
def regex_new_lines_and_blanks
  @regex_new_lines ||= begin
    pattern = '\n\n\n\n|\n\n\n|\n\n|\n|   '
    Regexp.new(pattern)
  end
end
regex_phone() click to toggle source
# File lib/definitions/regex.rb, line 21
# Returns the memoized phone-number pattern: three digits, three digits and
# four digits, where each gap may hold an optional ")" and an optional space
# or hyphen, and the second group may be preceded by "(".
#
# NOTE(review): an opening parenthesis is only allowed before the *second*
# digit group, not the first — confirm this is intended.
#
# @return [Regexp]
def regex_phone
  @regex_phone ||= begin
    pattern = '\d\d\d(|\))(| |-)(\(|)\d\d\d(|\))(| |-)\d\d\d\d'
    Regexp.new(pattern, Regexp::IGNORECASE)
  end
end
regex_professions() click to toggle source
# File lib/definitions/regex.rb, line 5
# Returns the memoized, case-insensitive job-title pattern: up to five
# leading words, one of the listed title keywords followed by a word boundary
# and an optional period, then up to five trailing words.
#
# Fixes the misspelled keyword "consutlant", which meant "consultant" titles
# were never matched.
#
# @return [Regexp]
def regex_professions
  @regex_professions ||= begin
    titles = 'coordinator|assistant|asst|manager|director|technician|analyst|associate|developer|programmer|nurse|consultant|worker|clerk|receptionist|secretary|teacher|engineer|administrator|researcher|head of|admin|intern|database|leader|server|waitress|waiter|busboy'
    Regexp.new("([A-Z][a-z]* ){0,5}(#{titles})\\b(\\.|)( [A-Z][a-z]*){0,5}", Regexp::IGNORECASE)
  end
end
regex_remove_extra_spaces() click to toggle source
# File lib/definitions/regex.rb, line 69
# Returns the memoized pattern matching a single space that is immediately
# preceded by two spaces (lookbehind), i.e. the third and later spaces of a run.
#
# @return [Regexp]
def regex_remove_extra_spaces
  @regex_remove_extra_spaces ||= begin
    two_spaces = ' ' * 2
    Regexp.new("(?<=#{two_spaces}) ")
  end
end
regex_schools() click to toggle source
# File lib/definitions/regex.rb, line 9
# Returns the memoized, case-insensitive school pattern: up to five leading
# words, the word "university" or "college" followed by a word boundary, and
# up to five trailing words.
#
# @return [Regexp]
def regex_schools
  @regex_schools ||= begin
    institutions = %w[university college].join("|")
    Regexp.new("([a-z]{1,} ){0,5}(#{institutions})\\b(( [a-z]{1,}){0,5}|)", Regexp::IGNORECASE)
  end
end
regex_season() click to toggle source
# File lib/definitions/regex.rb, line 45
# Returns the memoized, case-insensitive pattern matching any of the season
# names Winter, Fall, Summer or Spring.
#
# @return [Regexp]
def regex_season
  @regex_season ||= Regexp.new(%w[Winter Fall Summer Spring].join("|"), Regexp::IGNORECASE)
end
regex_section() click to toggle source
# File lib/definitions/regex.rb, line 53
# Returns the memoized, case-insensitive section-heading pattern: up to five
# leading words, one of the listed heading keywords, and up to five trailing
# words.
#
# @return [Regexp]
def regex_section
  @regex_section ||= begin
    headings = [
      "highlight", "professional development", "summary", "experience", "skills",
      "education", "qualifications", "interests", "profile"
    ].join("|")
    Regexp.new("([a-z]* ){0,5}(#{headings})( [a-z]*){0,5}", Regexp::IGNORECASE)
  end
end
regex_separate_tabbed_words() click to toggle source
# File lib/definitions/regex.rb, line 65
# Returns the memoized zero-width pattern matching the boundary between a
# letter and a following digit, a lowercase letter and a following uppercase
# letter, or a digit and a following letter.
#
# @return [Regexp]
def regex_separate_tabbed_words
  @regex_separate_tabbed_words ||= begin
    boundaries = [
      '(?<=[A-Za-z])(?=\d)',     # letter -> digit
      '(?<=[a-z])(?=[A-Z])',     # lowercase -> uppercase
      '(?<=\d)(?=[A-Za-z])'      # digit -> letter
    ]
    Regexp.new(boundaries.join("|"))
  end
end
regex_year() click to toggle source
# File lib/definitions/regex.rb, line 49
# Returns the memoized pattern matching a standalone four-digit or two-digit
# number (delimited by word boundaries on both sides).
#
# @return [Regexp]
def regex_year
  @regex_year ||= begin
    four_digits = '\b\d\d\d\d\b'
    two_digits = '\b\d\d\b'
    Regexp.new("#{four_digits}|#{two_digits}", Regexp::IGNORECASE)
  end
end
set_time_at_inception(time, presume) click to toggle source
# File lib/definitions/classifications.rb, line 22
# Stores +presume+ in the instance variable named after +time+ on the
# receiver (e.g. time "start" sets @start).
#
# @param time [#to_s] name of the instance variable, without the leading "@"
# @param presume [Object] value to store
# @return [Object] the stored value, as returned by instance_variable_set
def set_time_at_inception(time, presume)
  ivar_name = "@#{time}"
  instance_variable_set(ivar_name, presume)
end
stemmed(word) click to toggle source
# File lib/definitions/machines.rb, line 9
# Returns the result of calling +stem+ on the object returned by +stemmer+
# with the given word.
#
# @param word [Object] value passed straight through to +stemmer.stem+
# @return [Object] whatever +stemmer.stem+ returns
def stemmed(word)
  engine = stemmer
  engine.stem(word)
end
stemmer() click to toggle source
# File lib/definitions/machines.rb, line 5
# Returns the memoized Lingua::Stemmer instance, constructed with the
# :language option set to "en" on first use and cached in @stemmer.
#
# @return [Lingua::Stemmer]
def stemmer
  return @stemmer if defined?(@stemmer) && @stemmer

  @stemmer = Lingua::Stemmer.new(language: "en")
end
tgr() click to toggle source
# File lib/definitions/machines.rb, line 1
# Returns the memoized EngTagger instance, created on first use and cached
# in @tgr.
#
# @return [EngTagger]
def tgr
  return @tgr if defined?(@tgr) && @tgr

  @tgr = EngTagger.new
end