add base sourcecode

This commit is contained in:
Lukas Z 2022-07-25 22:29:53 +02:00
parent 79319cce2d
commit 19ceaca42b
2 changed files with 19 additions and 0 deletions

11
src/create_dataset.py Normal file
View file

@ -0,0 +1,11 @@
# Script: load the raw tweets table as the starting point for building a
# mention co-occurrence matrix. Only the loading step is implemented so far;
# the remaining pipeline steps are listed as TODOs at the bottom.
import pandas as pd

# Relative path, so it is resolved against the current working directory at
# run time, not against this file's location.
tweets_path = "../raw_data/tweets.csv"

# Parse the CSV into a DataFrame with pandas' default settings.
tweets = pd.read_csv(filepath_or_buffer=tweets_path)

# TODO: extract mentions from tweets
# TODO: generate co-occurrence matrix
# TODO: save co-occurrence matrix

8
src/create_id_list.py Normal file
View file

@ -0,0 +1,8 @@
# Script: print every value of the "id" column of the raw tweets CSV,
# one per line, to standard output.
import pandas as pd

# Relative path, so it is resolved against the current working directory at
# run time, not against this file's location.
tweets_path = "../raw_data/tweets.csv"

# Parse the CSV into a DataFrame with pandas' default settings.
tweets = pd.read_csv(tweets_path)

# The loop variable is named `tweet_id` rather than `id` so the builtin
# `id()` is not shadowed at module level. Raises KeyError if the CSV has
# no "id" column.
for tweet_id in tweets["id"]:
    print(tweet_id)