module DataScrubber

Private Instance Methods

get_input_lookup_table(dataset) click to toggle source
# File lib/cerebrum/data_scrubber.rb, line 10
def get_input_lookup_table(dataset)
  input_features = dataset.map { |ex| ex[:input] }
  (input_features.first.is_a? Array) ? nil : features_to_vector_index_lookup_table(input_features)
end
get_output_lookup_table(dataset) click to toggle source
# File lib/cerebrum/data_scrubber.rb, line 15
def get_output_lookup_table(dataset)
  output_features = dataset.map { |ex| ex[:output] }
  (output_features.first.is_a? Array) ? nil : features_to_vector_index_lookup_table(output_features)
end
scrub_dataset(dataset) click to toggle source
# File lib/cerebrum/data_scrubber.rb, line 4
def scrub_dataset(dataset)
  dataset = scrub_input(dataset) unless dataset[0][:input].is_a? Array
  dataset = scrub_output(dataset) unless dataset[0][:output].is_a? Array
  dataset
end
scrub_input(dataset) click to toggle source
# File lib/cerebrum/data_scrubber.rb, line 20
def scrub_input(dataset)
  input_lookup_table = get_input_lookup_table(dataset)
  dataset.each do |ex|
    ex[:input] = to_vector_given_features(ex[:input], input_lookup_table)
  end
end
scrub_output(dataset) click to toggle source
# File lib/cerebrum/data_scrubber.rb, line 27
def scrub_output(dataset)
  output_lookup_table = get_output_lookup_table(dataset)
  dataset.each do |ex|
    ex[:output] = to_vector_given_features(ex[:output], output_lookup_table)
  end
end