Slide 73
Slide 73 text
code
Preprocess 2/3
PROCESSING STREAMING DATA AT A LARGE SCALE WITH KAFKA
23 consumer.each_message do |message|
24 # We've received a message; parse the log line
25 log_line = parse(log_line_regex, geo_ip, message)
26
35 # Convert it to an intermediate format
36 page_view = {
37 'time' => log_line[2],
38 'ip' => log_line[1],
39 'country' => city.country_name,
40 'browser' => user_agent.browser,
41 'url' => url
42 }