Tokenisieren und Zählen
Aus einem Text werden mehrere Zeilen
-- Example tweet, raw:
--   RT @pugandcat: Whisker licking good food from @lilyskitchen
-- Same tweet in normalized form (presumably as stored in tweets_cleaned.text; verify):
--   rt pugandcat whisker licking good food from lilyskitchen

-- View tweets_words: one row per tweet, with the tweet text tokenized into an
-- array column `words`.
-- NOTE: split() interprets its second argument as a regular expression. With a
-- single-space pattern, consecutive spaces in `text` would yield empty-string
-- tokens, so this relies on `text` being single-space separated.
create or replace view tweets_words as
select
    `user`  -- quoted: `user` is a SQL keyword, so refer to the column explicitly
    ,created_at
    ,split(text, ' ') as `words`
from tweets_cleaned;

-- Example value of `words` for the tweet above:
--   ["rt","pugandcat","whisker","licking","good","food","from","lilyskitchen"]

-- Split the array of words into rows
-- explode() emits one output row per array element, so every word of a tweet
-- ends up in its own row.
select explode(words) as `word`
from tweets_words;

-- Redefinition of tweets_words (replaces any earlier view of the same name):
-- one row per word instead of one row per tweet.
-- posexplode() returns two columns per array element: the element's index in
-- the array (`position`, 0-based per the Spark SQL documentation) and the
-- element itself (`word`).
create or replace view tweets_words as
select
    id
    ,screen_name
    ,created_at
    ,lang
    ,posexplode(split(text, ' ')) as (position, word)
from tweets_cleaned;

-- Page footer residue from the original document: "Last updated"